diff --git "a/8b7178b58b/3430964.out" "b/8b7178b58b/3430964.out" new file mode 100644--- /dev/null +++ "b/8b7178b58b/3430964.out" @@ -0,0 +1,51786 @@ +Model parameters: d_model 4096 ffw_size 16384 kv_size 128 n_heads 32 n_layers 42 +Megatron-DeepSpeed/pretrain_gpt.py --tensor-model-parallel-size 2 --pipeline-model-parallel-size 2 --num-layers 42 --hidden-size 4096 --num-attention-heads 32 --kv-channels 128 --ffn-hidden-size 16384 --seq-length 2048 --max-position-embeddings 2048 --micro-batch-size 1 --global-batch-size 512 --train-samples 1 --vocab-file gpt2/vocab.json --merge-file gpt2/merges.txt --clip-grad 1.0 --kill-switch-path kill-switch-8b7178b58bval --bf16 --optimizer adam --adam-beta1 0.9 --adam-beta2 0.999 --adam-eps 1e-8 --lr 2e-4 --min-lr 2e-5 --lr-decay-style cosine --lr-decay-samples 1 --lr-warmup-samples 0 --clip-grad 1.0 --weight-decay 1e-1 --override-lr-scheduler --reset-progress --no-load-optim --log-interval 10 --save-interval 5000 --eval-interval 1 --eval-iters 100 --eval-only true --tensorboard-dir tensorboard_8b7178b58bval --tensorboard-queue-size 5 --log-timers-to-tensorboard --log-batch-size-to-tensorboard --log-validation-ppl-to-tensorboard --save lm1-8b7-178b-c4-repetitions/8b7178b58b --load lm1-8b7-178b-c4-repetitions/8b7178b58b --train-weighted-split-paths-path train400m.txt --valid-weighted-split-paths-path val.txt --data-impl mmap --num-workers 0 --valid-num-workers 0 --deepspeed --deepspeed_config ds_configs/3430964.json --zero-stage 0 +START 3430964: Sat 29 Apr 2023 11:24:02 AM EEST + 0: + 0: + 0: ======================= ROCm System Management Interface ======================= + 0: ================================= Concise Info ================================= + 0: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 0: 0 41.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: 2 45.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: 4 48.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: 6 39.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 0: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 0: ================================================================================ + 0: ============================= End of ROCm SMI Log ============================== +61: +61: +61: ======================= ROCm System Management Interface ======================= +61: ================================= Concise Info ================================= +61: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +61: 0 47.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +61: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +61: 2 42.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +61: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +61: 4 50.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +61: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +61: 6 43.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +61: 7 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +61: ================================================================================ +61: ============================= End of ROCm SMI Log ============================== +51: +51: +51: ======================= ROCm System Management Interface ======================= +51: ================================= Concise Info ================================= +51: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +51: 0 50.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +51: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +51: 2 42.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +51: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +51: 4 48.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +51: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +51: 6 44.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +51: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +51: ================================================================================ +51: ============================= End of ROCm SMI Log ============================== +63: +63: +63: ======================= ROCm System Management Interface ======================= +63: ================================= Concise Info ================================= +63: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +63: 0 49.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +63: 1 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +63: 2 42.0c 81.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +63: 3 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +63: 4 40.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +63: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +63: 6 36.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +63: 7 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +63: ================================================================================ +63: ============================= End of ROCm SMI Log ============================== +57: +57: +57: ======================= ROCm System Management Interface ======================= +57: ================================= Concise Info ================================= +57: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +57: 0 50.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +57: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +57: 2 44.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +57: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +57: 4 53.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +57: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +57: 6 41.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +57: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +57: ================================================================================ +57: ============================= End of ROCm SMI Log ============================== +59: +59: +59: ======================= ROCm System Management Interface ======================= +59: ================================= Concise Info ================================= +59: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +59: 0 49.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +59: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +59: 2 42.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +59: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +59: 4 44.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +59: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +59: 6 40.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +59: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +59: ================================================================================ +59: ============================= End of ROCm SMI Log ============================== +13: +13: +13: ======================= ROCm System Management Interface ======================= +13: ================================= Concise Info ================================= +13: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +13: 0 45.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: 2 36.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: 4 40.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 5 52.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: 6 41.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +13: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +13: ================================================================================ +13: ============================= End of ROCm SMI Log ============================== +58: +58: +58: ======================= ROCm System Management Interface ======================= +58: ================================= Concise Info ================================= +58: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +58: 0 54.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +58: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +58: 2 44.0c 101.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +58: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +58: 4 45.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +58: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +58: 6 41.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +58: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +58: ================================================================================ +58: ============================= End of ROCm SMI Log ============================== +27: +27: +27: ======================= ROCm System Management Interface ======================= +27: ================================= Concise Info ================================= +27: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +27: 0 46.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: 2 45.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: 4 45.0c 82.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: 6 41.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +27: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +27: ================================================================================ +27: ============================= End of ROCm SMI Log ============================== +22: +22: +22: ======================= ROCm System Management Interface ======================= +22: ================================= Concise Info ================================= +22: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +22: 0 46.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 1 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: 2 39.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 3 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: 4 44.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: 6 43.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +22: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +22: ================================================================================ +22: ============================= End of ROCm SMI Log ============================== +25: +25: +25: ======================= ROCm System Management Interface ======================= +25: ================================= Concise Info ================================= +25: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +25: 0 42.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 1 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: 2 38.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 3 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: 4 35.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: 6 47.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +25: 7 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +25: ================================================================================ +25: ============================= End of ROCm SMI Log ============================== +18: +18: +18: ======================= ROCm System Management Interface ======================= +18: ================================= Concise Info ================================= +18: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +18: 0 42.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: 2 43.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 3 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: 4 44.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: 6 42.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +18: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +18: ================================================================================ +18: ============================= End of ROCm SMI Log ============================== +17: +17: +17: ======================= ROCm System Management Interface ======================= +17: ================================= Concise Info ================================= +17: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +17: 0 43.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: 2 44.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 3 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: 4 43.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: 6 40.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +17: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +17: ================================================================================ +17: ============================= End of ROCm SMI Log ============================== +24: +24: +24: ======================= ROCm System Management Interface ======================= +24: ================================= Concise Info ================================= +24: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +24: 0 45.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: 2 42.0c 100.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: 4 44.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: 6 44.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +24: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +24: ================================================================================ +24: ============================= End of ROCm SMI Log ============================== +46: +46: +46: ======================= ROCm System Management Interface ======================= +46: ================================= Concise Info ================================= +46: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +46: 0 44.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +46: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +46: 2 42.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +46: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +46: 4 44.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +46: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +46: 6 44.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +46: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +46: ================================================================================ +46: ============================= End of ROCm SMI Log ============================== +34: +34: +34: ======================= ROCm System Management Interface ======================= +34: ================================= Concise Info ================================= +34: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +34: 0 51.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +34: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +34: 2 46.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +34: 3 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +34: 4 47.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +34: 5 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +34: 6 41.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +34: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +34: ================================================================================ +34: ============================= End of ROCm SMI Log ============================== +12: +12: +12: ======================= ROCm System Management Interface ======================= +12: ================================= Concise Info ================================= +12: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +12: 0 45.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 1 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: 2 44.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: 4 41.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: 6 43.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +12: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +12: ================================================================================ +12: ============================= End of ROCm SMI Log ============================== +54: +54: +54: ======================= ROCm System Management Interface ======================= +54: ================================= Concise Info ================================= +54: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +54: 0 48.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +54: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +54: 2 40.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +54: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +54: 4 50.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +54: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +54: 6 42.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +54: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +54: ================================================================================ +54: ============================= End of ROCm SMI Log ============================== + 3: + 3: + 3: ======================= ROCm System Management Interface ======================= + 3: ================================= Concise Info ================================= + 3: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 3: 0 40.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 1 40.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: 2 41.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: 4 43.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: 6 41.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 3: 7 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 3: ================================================================================ + 3: ============================= End of ROCm SMI Log ============================== +47: +47: +47: ======================= ROCm System Management Interface ======================= +47: ================================= Concise Info ================================= +47: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +47: 0 50.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +47: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +47: 2 44.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +47: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +47: 4 43.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +47: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +47: 6 44.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +47: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +47: ================================================================================ +47: ============================= End of ROCm SMI Log ============================== +37: +37: +37: ======================= ROCm System Management Interface ======================= +37: ================================= Concise Info ================================= +37: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +37: 0 46.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +37: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +37: 2 41.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +37: 3 40.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +37: 4 44.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +37: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +37: 6 41.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +37: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +37: ================================================================================ +37: ============================= End of ROCm SMI Log ============================== +41: +41: +41: ======================= ROCm System Management Interface ======================= +41: ================================= Concise Info ================================= +41: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +41: 0 48.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +41: 1 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +41: 2 46.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +41: 3 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +41: 4 49.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +41: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +41: 6 45.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +41: 7 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +41: ================================================================================ +41: ============================= End of ROCm SMI Log ============================== +48: +48: +48: ======================= ROCm System Management Interface ======================= +48: ================================= Concise Info ================================= +48: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +48: 0 48.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +48: 1 53.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +48: 2 42.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +48: 3 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +48: 4 48.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +48: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +48: 6 40.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +48: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +48: ================================================================================ +48: ============================= End of ROCm SMI Log ============================== +33: +33: +33: ======================= ROCm System Management Interface ======================= +33: ================================= Concise Info ================================= +33: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +33: 0 52.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +33: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +33: 2 40.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +33: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +33: 4 45.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +33: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +33: 6 45.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +33: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +33: ================================================================================ +33: ============================= End of ROCm SMI Log ============================== +53: +53: +53: ======================= ROCm System Management Interface ======================= +53: ================================= Concise Info ================================= +53: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +53: 0 48.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +53: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +53: 2 43.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +53: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +53: 4 44.0c 100.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +53: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +53: 6 40.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +53: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +53: ================================================================================ +53: ============================= End of ROCm SMI Log ============================== +10: +10: +10: ======================= ROCm System Management Interface ======================= +10: ================================= Concise Info ================================= +10: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +10: 0 46.0c 98.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 1 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: 2 38.0c 81.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: 4 43.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 5 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: 6 43.0c 81.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +10: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +10: ================================================================================ +10: ============================= End of ROCm SMI Log ============================== + 8: + 8: + 8: ======================= ROCm System Management Interface ======================= + 8: ================================= Concise Info ================================= + 8: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 8: 0 47.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 1 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: 2 39.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: 4 44.0c 82.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: 6 39.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 8: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 8: ================================================================================ + 8: ============================= End of ROCm SMI Log ============================== +56: +56: +56: ======================= ROCm System Management Interface ======================= +56: ================================= Concise Info ================================= +56: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +56: 0 46.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +56: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +56: 2 42.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +56: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +56: 4 43.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +56: 5 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +56: 6 45.0c 81.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +56: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +56: ================================================================================ +56: ============================= End of ROCm SMI Log ============================== +44: +44: +44: ======================= ROCm System Management Interface ======================= +44: ================================= Concise Info ================================= +44: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +44: 0 45.0c 98.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +44: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +44: 2 38.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +44: 3 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +44: 4 50.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +44: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +44: 6 42.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +44: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +44: ================================================================================ +44: ============================= End of ROCm SMI Log ============================== +55: +55: +55: ======================= ROCm System Management Interface ======================= +55: ================================= Concise Info ================================= +55: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +55: 0 42.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +55: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +55: 2 46.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +55: 3 38.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +55: 4 43.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +55: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +55: 6 40.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +55: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +55: ================================================================================ +55: ============================= End of ROCm SMI Log ============================== +20: +20: +20: ======================= ROCm System Management Interface ======================= +20: ================================= Concise Info ================================= +20: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +20: 0 47.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: 2 38.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 3 40.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: 4 42.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: 6 39.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +20: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +20: ================================================================================ +20: ============================= End of ROCm SMI Log ============================== +28: +28: +28: ======================= ROCm System Management Interface ======================= +28: ================================= Concise Info ================================= +28: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +28: 0 55.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: 2 39.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 3 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: 4 39.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: 6 39.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +28: 7 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +28: ================================================================================ +28: ============================= End of ROCm SMI Log ============================== +19: +19: +19: ======================= ROCm System Management Interface ======================= +19: ================================= Concise Info ================================= +19: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +19: 0 42.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: 2 40.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: 4 41.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: 6 45.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +19: 7 40.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +19: ================================================================================ +19: ============================= End of ROCm SMI Log ============================== +38: +38: +38: ======================= ROCm System Management Interface ======================= +38: ================================= Concise Info ================================= +38: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +38: 0 48.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +38: 1 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +38: 2 40.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +38: 3 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +38: 4 45.0c 82.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +38: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +38: 6 46.0c 82.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +38: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +38: ================================================================================ +38: ============================= End of ROCm SMI Log ============================== + 5: + 5: + 5: ======================= ROCm System Management Interface ======================= + 5: ================================= Concise Info ================================= + 5: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 5: 0 42.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: 2 45.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: 4 45.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: 6 50.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 5: 7 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 5: ================================================================================ + 5: ============================= End of ROCm SMI Log ============================== +35: +35: +35: ======================= ROCm System Management Interface ======================= +35: ================================= Concise Info ================================= +35: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +35: 0 43.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +35: 1 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +35: 2 42.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +35: 3 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +35: 4 44.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +35: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +35: 6 45.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +35: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +35: ================================================================================ +35: ============================= End of ROCm SMI Log ============================== +60: +60: +60: ======================= ROCm System Management Interface ======================= +60: ================================= Concise Info ================================= +60: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +60: 0 41.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +60: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +60: 2 43.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +60: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +60: 4 44.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +60: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +60: 6 49.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +60: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +60: ================================================================================ +60: ============================= End of ROCm SMI Log ============================== +42: +42: +42: ======================= ROCm System Management Interface ======================= +42: ================================= Concise Info ================================= +42: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +42: 0 47.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +42: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +42: 2 46.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +42: 3 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +42: 4 49.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +42: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +42: 6 44.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +42: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +42: ================================================================================ +42: ============================= End of ROCm SMI Log ============================== +30: +30: +30: ======================= ROCm System Management Interface ======================= +30: ================================= Concise Info ================================= +30: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +30: 0 45.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 1 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: 2 45.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 3 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: 4 44.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 5 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: 6 44.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +30: 7 52.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +30: ================================================================================ +30: ============================= End of ROCm SMI Log ============================== + 2: + 2: + 2: ======================= ROCm System Management Interface ======================= + 2: ================================= Concise Info ================================= + 2: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 2: 0 48.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: 2 41.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 3 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: 4 40.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: 6 37.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 2: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 2: ================================================================================ + 2: ============================= End of ROCm SMI Log ============================== + 1: + 1: + 1: ======================= ROCm System Management Interface ======================= + 1: ================================= Concise Info ================================= + 1: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 1: 0 52.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 1 40.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: 2 42.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: 4 45.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 5 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: 6 34.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 1: 7 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 1: ================================================================================ + 1: ============================= End of ROCm SMI Log ============================== +21: +21: +21: ======================= ROCm System Management Interface ======================= +21: ================================= Concise Info ================================= +21: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +21: 0 44.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: 2 43.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 3 40.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: 4 44.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: 6 44.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +21: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +21: ================================================================================ +21: ============================= End of ROCm SMI Log ============================== +43: +43: +43: ======================= ROCm System Management Interface ======================= +43: ================================= Concise Info ================================= +43: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +43: 0 42.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +43: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +43: 2 43.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +43: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +43: 4 44.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +43: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +43: 6 39.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +43: 7 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +43: ================================================================================ +43: ============================= End of ROCm SMI Log ============================== +29: +29: +29: ======================= ROCm System Management Interface ======================= +29: ================================= Concise Info ================================= +29: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +29: 0 49.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: 2 44.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: 4 44.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 5 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: 6 44.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +29: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +29: ================================================================================ +29: ============================= End of ROCm SMI Log ============================== +62: +62: +62: ======================= ROCm System Management Interface ======================= +62: ================================= Concise Info ================================= +62: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +62: 0 53.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +62: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +62: 2 47.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +62: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +62: 4 46.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +62: 5 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +62: 6 50.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +62: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +62: ================================================================================ +62: ============================= End of ROCm SMI Log ============================== +15: +15: +15: ======================= ROCm System Management Interface ======================= +15: ================================= Concise Info ================================= +15: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +15: 0 48.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: 2 46.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: 4 40.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: 6 38.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +15: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +15: ================================================================================ +15: ============================= End of ROCm SMI Log ============================== + 4: + 4: + 4: ======================= ROCm System Management Interface ======================= + 4: ================================= Concise Info ================================= + 4: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 4: 0 42.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: 2 43.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: 4 41.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 5 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: 6 41.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 4: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 4: ================================================================================ + 4: ============================= End of ROCm SMI Log ============================== +49: +49: +49: ======================= ROCm System Management Interface ======================= +49: ================================= Concise Info ================================= +49: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +49: 0 45.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +49: 1 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +49: 2 49.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +49: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +49: 4 47.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +49: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +49: 6 42.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +49: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +49: ================================================================================ +49: ============================= End of ROCm SMI Log ============================== +16: +16: +16: ======================= ROCm System Management Interface ======================= +16: ================================= Concise Info ================================= +16: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +16: 0 47.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: 2 43.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 3 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: 4 40.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: 6 42.0c 82.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +16: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +16: ================================================================================ +16: ============================= End of ROCm SMI Log ============================== + 9: + 9: + 9: ======================= ROCm System Management Interface ======================= + 9: ================================= Concise Info ================================= + 9: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 9: 0 46.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: 2 43.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 3 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: 4 42.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 5 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: 6 40.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 9: 7 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 9: ================================================================================ + 9: ============================= End of ROCm SMI Log ============================== +50: +50: +50: ======================= ROCm System Management Interface ======================= +50: ================================= Concise Info ================================= +50: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +50: 0 50.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +50: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +50: 2 45.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +50: 3 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +50: 4 44.0c 81.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +50: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +50: 6 37.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +50: 7 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +50: ================================================================================ +50: ============================= End of ROCm SMI Log ============================== +14: +14: +14: ======================= ROCm System Management Interface ======================= +14: ================================= Concise Info ================================= +14: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +14: 0 50.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 1 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: 2 42.0c 97.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: 4 45.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: 6 49.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +14: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +14: ================================================================================ +14: ============================= End of ROCm SMI Log ============================== +36: +36: +36: ======================= ROCm System Management Interface ======================= +36: ================================= Concise Info ================================= +36: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +36: 0 48.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +36: 1 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +36: 2 45.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +36: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +36: 4 42.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +36: 5 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +36: 6 47.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +36: 7 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +36: ================================================================================ +36: ============================= End of ROCm SMI Log ============================== +26: +26: +26: ======================= ROCm System Management Interface ======================= +26: ================================= Concise Info ================================= +26: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +26: 0 49.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 1 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: 2 37.0c 89.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: 4 38.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 5 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: 6 38.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +26: 7 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +26: ================================================================================ +26: ============================= End of ROCm SMI Log ============================== +23: +23: +23: ======================= ROCm System Management Interface ======================= +23: ================================= Concise Info ================================= +23: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +23: 0 46.0c 88.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: 2 39.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: 4 39.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: 6 40.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +23: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +23: ================================================================================ +23: ============================= End of ROCm SMI Log ============================== +40: +40: +40: ======================= ROCm System Management Interface ======================= +40: ================================= Concise Info ================================= +40: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +40: 0 46.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +40: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +40: 2 37.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +40: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +40: 4 44.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +40: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +40: 6 41.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +40: 7 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +40: ================================================================================ +40: ============================= End of ROCm SMI Log ============================== +11: +11: +11: ======================= ROCm System Management Interface ======================= +11: ================================= Concise Info ================================= +11: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +11: 0 37.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: 2 36.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 3 39.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: 4 43.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 5 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: 6 38.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +11: 7 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +11: ================================================================================ +11: ============================= End of ROCm SMI Log ============================== +39: +39: +39: ======================= ROCm System Management Interface ======================= +39: ================================= Concise Info ================================= +39: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +39: 0 47.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +39: 1 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +39: 2 51.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +39: 3 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +39: 4 37.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +39: 5 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +39: 6 46.0c 81.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +39: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +39: ================================================================================ +39: ============================= End of ROCm SMI Log ============================== + 7: + 7: + 7: ======================= ROCm System Management Interface ======================= + 7: ================================= Concise Info ================================= + 7: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 7: 0 44.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: 2 38.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: 4 43.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 5 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: 6 44.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 7: 7 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 7: ================================================================================ + 7: ============================= End of ROCm SMI Log ============================== +52: +52: +52: ======================= ROCm System Management Interface ======================= +52: ================================= Concise Info ================================= +52: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +52: 0 45.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +52: 1 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +52: 2 40.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +52: 3 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +52: 4 39.0c 87.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +52: 5 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +52: 6 42.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +52: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +52: ================================================================================ +52: ============================= End of ROCm SMI Log ============================== + 6: + 6: + 6: ======================= ROCm System Management Interface ======================= + 6: ================================= Concise Info ================================= + 6: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% + 6: 0 47.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 1 43.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: 2 39.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 3 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: 4 41.0c 85.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: 6 41.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% + 6: 7 42.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% + 6: ================================================================================ + 6: ============================= End of ROCm SMI Log ============================== +32: +32: +32: ======================= ROCm System Management Interface ======================= +32: ================================= Concise Info ================================= +32: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +32: 0 49.0c 90.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +32: 1 49.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +32: 2 45.0c 86.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +32: 3 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +32: 4 54.0c 95.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +32: 5 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +32: 6 42.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +32: 7 50.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +32: ================================================================================ +32: ============================= End of ROCm SMI Log ============================== +31: +31: +31: ======================= ROCm System Management Interface ======================= +31: ================================= Concise Info ================================= +31: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +31: 0 49.0c 91.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 1 48.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: 2 46.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 3 41.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: 4 45.0c 92.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 5 51.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: 6 44.0c 94.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +31: 7 46.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +31: ================================================================================ +31: ============================= End of ROCm SMI Log ============================== +45: +45: +45: ======================= ROCm System Management Interface ======================= +45: ================================= Concise Info ================================= +45: GPU Temp AvgPwr SCLK MCLK Fan Perf PwrCap VRAM% GPU% +45: 0 48.0c 93.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +45: 1 44.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +45: 2 39.0c 96.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +45: 3 47.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +45: 4 43.0c 84.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +45: 5 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +45: 6 37.0c 83.0W 800Mhz 1600Mhz 0% auto 560.0W 0% 0% +45: 7 45.0c N/A 800Mhz 1600Mhz 0% auto 0.0W 0% 0% +45: ================================================================================ +45: ============================= End of ROCm SMI Log ============================== +47: Launching on nid006792 (47/64), master nid006071 port 9999, GPUs 8, CUDA: True +18: Launching on nid006089 (18/64), master nid006071 port 9999, GPUs 8, CUDA: True +61: Launching on nid006806 (61/64), master nid006071 port 9999, GPUs 8, CUDA: True + 0: Launching on nid006071 (0/64), master nid006071 port 9999, GPUs 8, CUDA: True +42: Launching on nid006787 (42/64), master nid006071 port 9999, GPUs 8, CUDA: True + 3: Launching on nid006074 (3/64), master nid006071 port 9999, GPUs 8, CUDA: True +44: Launching on nid006789 (44/64), master nid006071 port 9999, GPUs 8, CUDA: True +55: Launching on nid006800 (55/64), master nid006071 port 9999, GPUs 8, CUDA: True +25: Launching on nid006096 (25/64), master nid006071 port 9999, GPUs 8, CUDA: True +22: Launching on nid006093 (22/64), master nid006071 port 9999, GPUs 8, CUDA: True +17: Launching on nid006088 (17/64), master nid006071 port 9999, GPUs 8, CUDA: True +58: Launching on nid006803 (58/64), master nid006071 port 9999, GPUs 8, CUDA: True +23: Launching on nid006094 (23/64), master nid006071 port 9999, GPUs 8, CUDA: True +12: Launching on nid006083 (12/64), master nid006071 port 9999, GPUs 8, CUDA: True +29: Launching on nid006774 (29/64), master nid006071 port 9999, GPUs 8, CUDA: True +63: Launching on nid006808 (63/64), master nid006071 port 9999, GPUs 8, CUDA: True + 1: Launching on nid006072 (1/64), master nid006071 port 9999, GPUs 8, CUDA: True +16: Launching on nid006087 (16/64), master nid006071 port 9999, GPUs 8, CUDA: True +56: Launching on nid006801 (56/64), master nid006071 port 9999, GPUs 8, CUDA: True + 2: Launching on nid006073 (2/64), master nid006071 port 9999, GPUs 8, CUDA: True +13: Launching on nid006084 (13/64), master nid006071 port 9999, GPUs 8, CUDA: True +37: Launching on nid006782 (37/64), master nid006071 port 9999, GPUs 8, CUDA: True +27: Launching on nid006772 (27/64), master nid006071 port 9999, GPUs 8, CUDA: True +60: Launching on nid006805 (60/64), master nid006071 port 9999, GPUs 8, CUDA: True +34: Launching on nid006779 (34/64), master nid006071 port 9999, GPUs 8, CUDA: True +43: Launching on nid006788 (43/64), master nid006071 port 9999, GPUs 8, CUDA: True +59: Launching on nid006804 (59/64), master nid006071 port 9999, GPUs 8, CUDA: True +41: Launching on nid006786 (41/64), master nid006071 port 9999, GPUs 8, CUDA: True +33: Launching on nid006778 (33/64), master nid006071 port 9999, GPUs 8, CUDA: True + 5: Launching on nid006076 (5/64), master nid006071 port 9999, GPUs 8, CUDA: True + 9: Launching on nid006080 (9/64), master nid006071 port 9999, GPUs 8, CUDA: True +26: Launching on nid006097 (26/64), master nid006071 port 9999, GPUs 8, CUDA: True +62: Launching on nid006807 (62/64), master nid006071 port 9999, GPUs 8, CUDA: True +48: Launching on nid006793 (48/64), master nid006071 port 9999, GPUs 8, CUDA: True +51: Launching on nid006796 (51/64), master nid006071 port 9999, GPUs 8, CUDA: True +19: Launching on nid006090 (19/64), master nid006071 port 9999, GPUs 8, CUDA: True +54: Launching on nid006799 (54/64), master nid006071 port 9999, GPUs 8, CUDA: True +57: Launching on nid006802 (57/64), master nid006071 port 9999, GPUs 8, CUDA: True +30: Launching on nid006775 (30/64), master nid006071 port 9999, GPUs 8, CUDA: True +38: Launching on nid006783 (38/64), master nid006071 port 9999, GPUs 8, CUDA: True +10: Launching on nid006081 (10/64), master nid006071 port 9999, GPUs 8, CUDA: True +15: Launching on nid006086 (15/64), master nid006071 port 9999, GPUs 8, CUDA: True +14: Launching on nid006085 (14/64), master nid006071 port 9999, GPUs 8, CUDA: True +35: Launching on nid006780 (35/64), master nid006071 port 9999, GPUs 8, CUDA: True +46: Launching on nid006791 (46/64), master nid006071 port 9999, GPUs 8, CUDA: True +28: Launching on nid006773 (28/64), master nid006071 port 9999, GPUs 8, CUDA: True +53: Launching on nid006798 (53/64), master nid006071 port 9999, GPUs 8, CUDA: True +24: Launching on nid006095 (24/64), master nid006071 port 9999, GPUs 8, CUDA: True + 8: Launching on nid006079 (8/64), master nid006071 port 9999, GPUs 8, CUDA: True +21: Launching on nid006092 (21/64), master nid006071 port 9999, GPUs 8, CUDA: True + 4: Launching on nid006075 (4/64), master nid006071 port 9999, GPUs 8, CUDA: True +20: Launching on nid006091 (20/64), master nid006071 port 9999, GPUs 8, CUDA: True +36: Launching on nid006781 (36/64), master nid006071 port 9999, GPUs 8, CUDA: True +49: Launching on nid006794 (49/64), master nid006071 port 9999, GPUs 8, CUDA: True +40: Launching on nid006785 (40/64), master nid006071 port 9999, GPUs 8, CUDA: True + 7: Launching on nid006078 (7/64), master nid006071 port 9999, GPUs 8, CUDA: True + 6: Launching on nid006077 (6/64), master nid006071 port 9999, GPUs 8, CUDA: True +50: Launching on nid006795 (50/64), master nid006071 port 9999, GPUs 8, CUDA: True +45: Launching on nid006790 (45/64), master nid006071 port 9999, GPUs 8, CUDA: True +11: Launching on nid006082 (11/64), master nid006071 port 9999, GPUs 8, CUDA: True +32: Launching on nid006777 (32/64), master nid006071 port 9999, GPUs 8, CUDA: True +31: Launching on nid006776 (31/64), master nid006071 port 9999, GPUs 8, CUDA: True +52: Launching on nid006797 (52/64), master nid006071 port 9999, GPUs 8, CUDA: True +39: Launching on nid006784 (39/64), master nid006071 port 9999, GPUs 8, CUDA: True +63: > setting tensorboard ... + 0: using world size: 512, data-parallel-size: 128, tensor-model-parallel size: 2, pipeline-model-parallel size: 2 + 0: accumulate and all-reduce gradients in fp32 for bfloat16 data type. + 0: using torch.bfloat16 for parameters ... + 0: ------------------------ arguments ------------------------ + 0: abort_on_unmet_fused_kernel_constraints ......... False + 0: accumulate_allreduce_grads_in_fp32 .............. True + 0: adam_beta1 ...................................... 0.9 + 0: adam_beta2 ...................................... 0.999 + 0: adam_eps ........................................ 1e-08 + 0: adlr_autoresume ................................. False + 0: adlr_autoresume_interval ........................ 1000 + 0: apply_query_key_layer_scaling ................... True + 0: apply_residual_connection_post_layernorm ........ False + 0: attention_dropout ............................... 0.1 + 0: attention_softmax_in_fp32 ....................... False + 0: bert_binary_head ................................ True + 0: bert_load ....................................... None + 0: bf16 ............................................ True + 0: bias_dropout_fusion ............................. True + 0: bias_gelu_fusion ................................ True + 0: biencoder_projection_dim ........................ 0 + 0: biencoder_shared_query_context_model ............ False + 0: block_data_path ................................. None + 0: checkpoint_activations .......................... False + 0: checkpoint_in_cpu ............................... False + 0: checkpoint_num_layers ........................... 1 + 0: clip_grad ....................................... 1.0 + 0: codecarbon_dir .................................. None + 0: consumed_train_samples .......................... 0 + 0: consumed_train_tokens ........................... 0 + 0: consumed_valid_samples .......................... 0 + 0: contigious_checkpointing ........................ False + 0: cpu_optimizer ................................... False + 0: cpu_torch_adam .................................. False + 0: curriculum_learning ............................. False + 0: data_impl ....................................... mmap + 0: data_parallel_size .............................. 128 + 0: data_path ....................................... None + 0: dataloader_type ................................. single + 0: DDP_impl ........................................ local + 0: decoder_seq_length .............................. None + 0: deepscale ....................................... False + 0: deepscale_config ................................ None + 0: deepspeed ....................................... True + 0: deepspeed_activation_checkpointing .............. False + 0: deepspeed_config ................................ ds_configs/3430964.json + 0: deepspeed_mpi ................................... False + 0: distribute_checkpointed_activations ............. False + 0: distributed_backend ............................. nccl + 0: embed_layernorm ................................. False + 0: embedding_path .................................. None + 0: encoder_seq_length .............................. 2048 + 0: eod_mask_loss ................................... False + 0: eval_interval ................................... 1 + 0: eval_iters ...................................... 100 + 0: eval_only ....................................... True + 0: evidence_data_path .............................. None + 0: exit_duration_in_mins ........................... None + 0: exit_interval ................................... None + 0: ffn_hidden_size ................................. 16384 + 0: finetune ........................................ False + 0: fp16 ............................................ False + 0: fp16_lm_cross_entropy ........................... False + 0: fp32_residual_connection ........................ False + 0: gigaflos_no_embeds .............................. 0 + 0: global_batch_size ............................... 512 + 0: glu_activation .................................. None + 0: hidden_dropout .................................. 0.1 + 0: hidden_size ..................................... 4096 + 0: hysteresis ...................................... 2 + 0: ict_head_size ................................... None + 0: ict_load ........................................ None + 0: img_dim ......................................... 224 + 0: indexer_batch_size .............................. 128 + 0: indexer_log_interval ............................ 1000 + 0: inference ....................................... False + 0: init_method_std ................................. 0.02 + 0: init_method_xavier_uniform ...................... False + 0: initial_loss_scale .............................. 4294967296 + 0: kill_switch_path ................................ kill-switch-8b7178b58bval + 0: kv_channels ..................................... 128 + 0: layer_norm_fusion ............................... True + 0: layernorm_epsilon ............................... 1e-05 + 0: lazy_mpu_init ................................... None + 0: load ............................................ lm1-8b7-178b-c4-repetitions/8b7178b58b + 0: local_rank ...................................... None + 0: log_batch_size_to_tensorboard ................... True + 0: log_interval .................................... 10 + 0: log_learning_rate_to_tensorboard ................ True + 0: log_level ....................................... None + 0: log_level_replica ............................... None + 0: log_loss_scale_to_tensorboard ................... True + 0: log_num_zeros_in_grad ........................... False + 0: log_params_norm ................................. False + 0: log_path ........................................ None + 0: log_timers_to_tensorboard ....................... True + 0: log_validation_ppl_to_tensorboard ............... True + 0: loss_on_targets_only ............................ False + 0: loss_scale ...................................... None + 0: loss_scale_window ............................... 1000 + 0: lr .............................................. 0.0002 + 0: lr_decay_iters .................................. None + 0: lr_decay_samples ................................ 1 + 0: lr_decay_style .................................. cosine + 0: lr_decay_tokens ................................. None + 0: lr_warmup_fraction .............................. None + 0: lr_warmup_iters ................................. 0 + 0: lr_warmup_samples ............................... 0 + 0: make_vocab_size_divisible_by .................... 128 + 0: mask_prob ....................................... 0.15 + 0: masked_softmax_fusion ........................... True + 0: max_position_embeddings ......................... 2048 + 0: mean_noise_span_length .......................... None + 0: memory_centric_tiled_linear ..................... False + 0: merge_file ...................................... gpt2/merges.txt + 0: micro_batch_size ................................ 1 + 0: min_loss_scale .................................. 1.0 + 0: min_lr .......................................... 2e-05 + 0: mmap_warmup ..................................... False + 0: no_load_optim ................................... True + 0: no_load_rng ..................................... None + 0: no_save_optim ................................... None + 0: no_save_rng ..................................... None + 0: noise_density ................................... None + 0: num_attention_heads ............................. 32 + 0: num_channels .................................... 3 + 0: num_classes ..................................... 1000 + 0: num_layers ...................................... 42 + 0: num_layers_per_virtual_pipeline_stage ........... None + 0: num_workers ..................................... 0 + 0: onnx_safe ....................................... None + 0: openai_gelu ..................................... False + 0: optimizer ....................................... adam + 0: optimizer_fusion ................................ True + 0: override_lr_scheduler ........................... True + 0: pad_vocab_size_to ............................... None + 0: params_dtype .................................... torch.bfloat16 + 0: partition_activations ........................... False + 0: patch_dim ....................................... 16 + 0: pipeline_model_parallel_size .................... 2 + 0: position_embedding_type ......................... PositionEmbeddingType.absolute + 0: pp_partition_method ............................. None + 0: profile_backward ................................ False + 0: query_in_block_prob ............................. 0.1 + 0: rampup_batch_size ............................... None + 0: rank ............................................ 0 + 0: remote_device ................................... none + 0: reset_attention_mask ............................ False + 0: reset_position_ids .............................. False + 0: reset_progress .................................. True + 0: retriever_report_topk_accuracies ................ [] + 0: retriever_score_scaling ......................... False + 0: retriever_seq_length ............................ 256 + 0: reweight_loss_based_on_position_frequency ....... False + 0: sample_rate ..................................... 1.0 + 0: save ............................................ lm1-8b7-178b-c4-repetitions/8b7178b58b + 0: save_interval ................................... 5000 + 0: scatter_gather_tensors_in_pipeline .............. True + 0: scattered_embeddings ............................ False + 0: seed ............................................ 1234 + 0: seq_length ...................................... 2048 + 0: sgd_momentum .................................... 0.9 + 0: short_seq_prob .................................. 0.1 + 0: skip_train_iteration_range ...................... None + 0: split ........................................... None + 0: split_transformers .............................. False + 0: sync_tp_duplicated_parameters ................... False + 0: synchronize_each_layer .......................... False + 0: tensor_model_parallel_size ...................... 2 + 0: tensorboard_dir ................................. tensorboard_8b7178b58bval + 0: tensorboard_log_interval ........................ 1 + 0: tensorboard_queue_size .......................... 5 + 0: test_weighted_split_paths ....................... None + 0: test_weighted_split_paths_path .................. None + 0: tile_factor ..................................... 1 + 0: titles_data_path ................................ None + 0: tokenizer_name_or_path .......................... None + 0: tokenizer_type .................................. GPT2BPETokenizer + 0: train_iters ..................................... None + 0: train_samples ................................... 1 + 0: train_tokens .................................... None + 0: train_weighted_split_names ...................... ['train'] + 0: train_weighted_split_paths ...................... [['/scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_400M_text_document']] + 0: train_weighted_split_paths_path ................. None + 0: train_weighted_split_splits ..................... [['0:1']] + 0: train_weighted_split_weights .................... [['1.0']] + 0: universal_checkpoint ............................ False + 0: use_bnb_optimizer ............................... False + 0: use_checkpoint_lr_scheduler ..................... False + 0: use_contiguous_buffers_in_ddp ................... True + 0: use_cpu_initialization .......................... None + 0: use_one_sent_docs ............................... False + 0: use_pin_memory .................................. False + 0: valid_num_workers ............................... 0 + 0: valid_weighted_split_names ...................... ['validation'] + 0: valid_weighted_split_paths ...................... [['/scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document']] + 0: valid_weighted_split_paths_path ................. None + 0: valid_weighted_split_splits ..................... [['0:1']] + 0: valid_weighted_split_weights .................... [['1.0']] + 0: virtual_pipeline_model_parallel_size ............ None + 0: vocab_extra_ids ................................. 0 + 0: vocab_file ...................................... gpt2/vocab.json + 0: weight_decay .................................... 0.1 + 0: world_size ...................................... 512 + 0: zero_allgather_bucket_size ...................... 0.0 + 0: zero_contigious_gradients ....................... False + 0: zero_reduce_bucket_size ......................... 0.0 + 0: zero_reduce_scatter ............................. False + 0: zero_stage ...................................... 0 + 0: -------------------- end of arguments --------------------- + 0: setting number of micro-batches to constant 4 + 0: > building GPT2BPETokenizer tokenizer ... + 0: > padded vocab (size: 50257) with 175 dummy tokens (new size: 50432) + 0: DeepSpeed general environment info: + 0: torch install path ............... ['/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch'] + 0: torch version .................... 1.13.0+rocm5.2 + 0: torch cuda version ............... None + 0: torch hip version ................ 5.2.21151-afdc89f8 + 0: nvcc version ..................... None + 0: deepspeed install path ........... ['/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/deepspeed'] + 0: deepspeed info ................... 0.7.5, unknown, unknown + 0: deepspeed wheel compiled w. ...... torch 1.13, hip 5.1 + 0: **** Git info for Megatron: git_hash=unknown git_branch=unknown **** + 0: > initializing torch distributed ... + 0: [2023-04-29 11:25:38,719] [INFO] [comm.py:633:init_distributed] Initializing TorchBackend in DeepSpeed with backend nccl + 0: > initializing tensor model parallel with size 2 + 0: > initializing pipeline model parallel with size 2 + 0: > setting random seeds to 1234 ... + 0: > initializing model parallel cuda seeds on global rank 0, model parallel rank 0, and data parallel rank 0 with model parallel seed: 3952 and data parallel seed: 1234 + 0: > compiling dataset index builder ... + 0: make: Entering directory '/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/data' + 0: make: Nothing to be done for 'default'. + 0: make: Leaving directory '/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/data' + 0: >>> done with dataset index builder. Compilation time: 0.095 seconds + 0: > compiling and loading fused kernels ... + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.cpp -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.cpp [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_cuda.cu -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.hip [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.h [skipped, already hipified] + 0: Total number of unsupported CUDA function calls: 0 + 0: + 0: + 0: Total number of replaced kernel launches: 102 + 0: ninja: no work to do. + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_cuda.cpp -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_cuda.cpp [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_cuda_kernel.cu -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/layer_norm_hip_kernel.hip [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/type_shim.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/compat.h [skipped, no changes] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_upper_triang_masked_softmax_hip.h [skipped, already hipified] + 0: /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax.h -> /pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/Megatron-DeepSpeed/megatron/fused_kernels/scaled_masked_softmax_hip.h [skipped, already hipified] + 0: Total number of unsupported CUDA function calls: 0 + 0: + 0: + 0: Total number of replaced kernel launches: 67 + 0: [1/1] c++ layer_norm_hip_kernel.cuda.o layer_norm_cuda.o -shared -L/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/venv/lib/python3.9/site-packages/torch/lib -lc10 -lc10_hip -ltorch_cpu -ltorch_hip -ltorch -ltorch_python -L/opt/rocm/lib -lamdhip64 -o fused_mix_prec_layer_norm_cuda.so + 0: >>> done with compiling and loading fused kernels. Compilation time: 26.723 seconds + 0: time to initialize megatron (seconds): 41.532 + 0: [after megatron is initialized] datetime: 2023-04-29 11:26:17 + 0: building GPT model ... + 0: [2023-04-29 11:26:17,703] [INFO] [utils.py:827:see_memory_usage] Before Building Model + 0: [2023-04-29 11:26:17,704] [INFO] [utils.py:828:see_memory_usage] MA 0.0 GB Max_MA 0.0 GB CA 0.0 GB Max_CA 0 GB + 0: [2023-04-29 11:26:17,704] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 38.33 GB, percent = 7.6% + 0: SEED_LAYERS=False BASE_SEED=1234 SEED_FN=None + 0: Using topology: {ProcessCoord(pipe=0, data=0, model=0): 0, ProcessCoord(pipe=0, data=0, model=1): 1, ProcessCoord(pipe=0, data=1, model=0): 2, ProcessCoord(pipe=0, data=1, model=1): 3, ProcessCoord(pipe=0, data=2, model=0): 4, ProcessCoord(pipe=0, data=2, model=1): 5, ProcessCoord(pipe=0, data=3, model=0): 6, ProcessCoord(pipe=0, data=3, model=1): 7, ProcessCoord(pipe=0, data=4, model=0): 8, ProcessCoord(pipe=0, data=4, model=1): 9, ProcessCoord(pipe=0, data=5, model=0): 10, ProcessCoord(pipe=0, data=5, model=1): 11, ProcessCoord(pipe=0, data=6, model=0): 12, ProcessCoord(pipe=0, data=6, model=1): 13, ProcessCoord(pipe=0, data=7, model=0): 14, ProcessCoord(pipe=0, data=7, model=1): 15, ProcessCoord(pipe=0, data=8, model=0): 16, ProcessCoord(pipe=0, data=8, model=1): 17, ProcessCoord(pipe=0, data=9, model=0): 18, ProcessCoord(pipe=0, data=9, model=1): 19, ProcessCoord(pipe=0, data=10, model=0): 20, ProcessCoord(pipe=0, data=10, model=1): 21, ProcessCoord(pipe=0, data=11, model=0): 22, ProcessCoord(pipe=0, data + 0: =11, model=1): 23, ProcessCoord(pipe=0, data=12, model=0): 24, ProcessCoord(pipe=0, data=12, model=1): 25, ProcessCoord(pipe=0, data=13, model=0): 26, ProcessCoord(pipe=0, data=13, model=1): 27, ProcessCoord(pipe=0, data=14, model=0): 28, ProcessCoord(pipe=0, data=14, model=1): 29, ProcessCoord(pipe=0, data=15, model=0): 30, ProcessCoord(pipe=0, data=15, model=1): 31, ProcessCoord(pipe=0, data=16, model=0): 32, ProcessCoord(pipe=0, data=16, model=1): 33, ProcessCoord(pipe=0, data=17, model=0): 34, ProcessCoord(pipe=0, data=17, model=1): 35, ProcessCoord(pipe=0, data=18, model=0): 36, ProcessCoord(pipe=0, data=18, model=1): 37, ProcessCoord(pipe=0, data=19, model=0): 38, ProcessCoord(pipe=0, data=19, model=1): 39, ProcessCoord(pipe=0, data=20, model=0): 40, ProcessCoord(pipe=0, data=20, model=1): 41, ProcessCoord(pipe=0, data=21, model=0): 42, ProcessCoord(pipe=0, data=21, model=1): 43, ProcessCoord(pipe=0, data=22, model=0): 44, ProcessCoord(pipe=0, data=22, model=1): 45, ProcessCoord(pipe=0, data=23, model=0 + 0: ): 46, ProcessCoord(pipe=0, data=23, model=1): 47, ProcessCoord(pipe=0, data=24, model=0): 48, ProcessCoord(pipe=0, data=24, model=1): 49, ProcessCoord(pipe=0, data=25, model=0): 50, ProcessCoord(pipe=0, data=25, model=1): 51, ProcessCoord(pipe=0, data=26, model=0): 52, ProcessCoord(pipe=0, data=26, model=1): 53, ProcessCoord(pipe=0, data=27, model=0): 54, ProcessCoord(pipe=0, data=27, model=1): 55, ProcessCoord(pipe=0, data=28, model=0): 56, ProcessCoord(pipe=0, data=28, model=1): 57, ProcessCoord(pipe=0, data=29, model=0): 58, ProcessCoord(pipe=0, data=29, model=1): 59, ProcessCoord(pipe=0, data=30, model=0): 60, ProcessCoord(pipe=0, data=30, model=1): 61, ProcessCoord(pipe=0, data=31, model=0): 62, ProcessCoord(pipe=0, data=31, model=1): 63, ProcessCoord(pipe=0, data=32, model=0): 64, ProcessCoord(pipe=0, data=32, model=1): 65, ProcessCoord(pipe=0, data=33, model=0): 66, ProcessCoord(pipe=0, data=33, model=1): 67, ProcessCoord(pipe=0, data=34, model=0): 68, ProcessCoord(pipe=0, data=34, model=1): 69, Proce + 0: ssCoord(pipe=0, data=35, model=0): 70, ProcessCoord(pipe=0, data=35, model=1): 71, ProcessCoord(pipe=0, data=36, model=0): 72, ProcessCoord(pipe=0, data=36, model=1): 73, ProcessCoord(pipe=0, data=37, model=0): 74, ProcessCoord(pipe=0, data=37, model=1): 75, ProcessCoord(pipe=0, data=38, model=0): 76, ProcessCoord(pipe=0, data=38, model=1): 77, ProcessCoord(pipe=0, data=39, model=0): 78, ProcessCoord(pipe=0, data=39, model=1): 79, ProcessCoord(pipe=0, data=40, model=0): 80, ProcessCoord(pipe=0, data=40, model=1): 81, ProcessCoord(pipe=0, data=41, model=0): 82, ProcessCoord(pipe=0, data=41, model=1): 83, ProcessCoord(pipe=0, data=42, model=0): 84, ProcessCoord(pipe=0, data=42, model=1): 85, ProcessCoord(pipe=0, data=43, model=0): 86, ProcessCoord(pipe=0, data=43, model=1): 87, ProcessCoord(pipe=0, data=44, model=0): 88, ProcessCoord(pipe=0, data=44, model=1): 89, ProcessCoord(pipe=0, data=45, model=0): 90, ProcessCoord(pipe=0, data=45, model=1): 91, ProcessCoord(pipe=0, data=46, model=0): 92, ProcessCoord(pipe + 0: =0, data=46, model=1): 93, ProcessCoord(pipe=0, data=47, model=0): 94, ProcessCoord(pipe=0, data=47, model=1): 95, ProcessCoord(pipe=0, data=48, model=0): 96, ProcessCoord(pipe=0, data=48, model=1): 97, ProcessCoord(pipe=0, data=49, model=0): 98, ProcessCoord(pipe=0, data=49, model=1): 99, ProcessCoord(pipe=0, data=50, model=0): 100, ProcessCoord(pipe=0, data=50, model=1): 101, ProcessCoord(pipe=0, data=51, model=0): 102, ProcessCoord(pipe=0, data=51, model=1): 103, ProcessCoord(pipe=0, data=52, model=0): 104, ProcessCoord(pipe=0, data=52, model=1): 105, ProcessCoord(pipe=0, data=53, model=0): 106, ProcessCoord(pipe=0, data=53, model=1): 107, ProcessCoord(pipe=0, data=54, model=0): 108, ProcessCoord(pipe=0, data=54, model=1): 109, ProcessCoord(pipe=0, data=55, model=0): 110, ProcessCoord(pipe=0, data=55, model=1): 111, ProcessCoord(pipe=0, data=56, model=0): 112, ProcessCoord(pipe=0, data=56, model=1): 113, ProcessCoord(pipe=0, data=57, model=0): 114, ProcessCoord(pipe=0, data=57, model=1): 115, ProcessCoord( + 0: pipe=0, data=58, model=0): 116, ProcessCoord(pipe=0, data=58, model=1): 117, ProcessCoord(pipe=0, data=59, model=0): 118, ProcessCoord(pipe=0, data=59, model=1): 119, ProcessCoord(pipe=0, data=60, model=0): 120, ProcessCoord(pipe=0, data=60, model=1): 121, ProcessCoord(pipe=0, data=61, model=0): 122, ProcessCoord(pipe=0, data=61, model=1): 123, ProcessCoord(pipe=0, data=62, model=0): 124, ProcessCoord(pipe=0, data=62, model=1): 125, ProcessCoord(pipe=0, data=63, model=0): 126, ProcessCoord(pipe=0, data=63, model=1): 127, ProcessCoord(pipe=0, data=64, model=0): 128, ProcessCoord(pipe=0, data=64, model=1): 129, ProcessCoord(pipe=0, data=65, model=0): 130, ProcessCoord(pipe=0, data=65, model=1): 131, ProcessCoord(pipe=0, data=66, model=0): 132, ProcessCoord(pipe=0, data=66, model=1): 133, ProcessCoord(pipe=0, data=67, model=0): 134, ProcessCoord(pipe=0, data=67, model=1): 135, ProcessCoord(pipe=0, data=68, model=0): 136, ProcessCoord(pipe=0, data=68, model=1): 137, ProcessCoord(pipe=0, data=69, model=0): 138, Pr + 0: ocessCoord(pipe=0, data=69, model=1): 139, ProcessCoord(pipe=0, data=70, model=0): 140, ProcessCoord(pipe=0, data=70, model=1): 141, ProcessCoord(pipe=0, data=71, model=0): 142, ProcessCoord(pipe=0, data=71, model=1): 143, ProcessCoord(pipe=0, data=72, model=0): 144, ProcessCoord(pipe=0, data=72, model=1): 145, ProcessCoord(pipe=0, data=73, model=0): 146, ProcessCoord(pipe=0, data=73, model=1): 147, ProcessCoord(pipe=0, data=74, model=0): 148, ProcessCoord(pipe=0, data=74, model=1): 149, ProcessCoord(pipe=0, data=75, model=0): 150, ProcessCoord(pipe=0, data=75, model=1): 151, ProcessCoord(pipe=0, data=76, model=0): 152, ProcessCoord(pipe=0, data=76, model=1): 153, ProcessCoord(pipe=0, data=77, model=0): 154, ProcessCoord(pipe=0, data=77, model=1): 155, ProcessCoord(pipe=0, data=78, model=0): 156, ProcessCoord(pipe=0, data=78, model=1): 157, ProcessCoord(pipe=0, data=79, model=0): 158, ProcessCoord(pipe=0, data=79, model=1): 159, ProcessCoord(pipe=0, data=80, model=0): 160, ProcessCoord(pipe=0, data=80, model= + 0: 1): 161, ProcessCoord(pipe=0, data=81, model=0): 162, ProcessCoord(pipe=0, data=81, model=1): 163, ProcessCoord(pipe=0, data=82, model=0): 164, ProcessCoord(pipe=0, data=82, model=1): 165, ProcessCoord(pipe=0, data=83, model=0): 166, ProcessCoord(pipe=0, data=83, model=1): 167, ProcessCoord(pipe=0, data=84, model=0): 168, ProcessCoord(pipe=0, data=84, model=1): 169, ProcessCoord(pipe=0, data=85, model=0): 170, ProcessCoord(pipe=0, data=85, model=1): 171, ProcessCoord(pipe=0, data=86, model=0): 172, ProcessCoord(pipe=0, data=86, model=1): 173, ProcessCoord(pipe=0, data=87, model=0): 174, ProcessCoord(pipe=0, data=87, model=1): 175, ProcessCoord(pipe=0, data=88, model=0): 176, ProcessCoord(pipe=0, data=88, model=1): 177, ProcessCoord(pipe=0, data=89, model=0): 178, ProcessCoord(pipe=0, data=89, model=1): 179, ProcessCoord(pipe=0, data=90, model=0): 180, ProcessCoord(pipe=0, data=90, model=1): 181, ProcessCoord(pipe=0, data=91, model=0): 182, ProcessCoord(pipe=0, data=91, model=1): 183, ProcessCoord(pipe=0, data + 0: =92, model=0): 184, ProcessCoord(pipe=0, data=92, model=1): 185, ProcessCoord(pipe=0, data=93, model=0): 186, ProcessCoord(pipe=0, data=93, model=1): 187, ProcessCoord(pipe=0, data=94, model=0): 188, ProcessCoord(pipe=0, data=94, model=1): 189, ProcessCoord(pipe=0, data=95, model=0): 190, ProcessCoord(pipe=0, data=95, model=1): 191, ProcessCoord(pipe=0, data=96, model=0): 192, ProcessCoord(pipe=0, data=96, model=1): 193, ProcessCoord(pipe=0, data=97, model=0): 194, ProcessCoord(pipe=0, data=97, model=1): 195, ProcessCoord(pipe=0, data=98, model=0): 196, ProcessCoord(pipe=0, data=98, model=1): 197, ProcessCoord(pipe=0, data=99, model=0): 198, ProcessCoord(pipe=0, data=99, model=1): 199, ProcessCoord(pipe=0, data=100, model=0): 200, ProcessCoord(pipe=0, data=100, model=1): 201, ProcessCoord(pipe=0, data=101, model=0): 202, ProcessCoord(pipe=0, data=101, model=1): 203, ProcessCoord(pipe=0, data=102, model=0): 204, ProcessCoord(pipe=0, data=102, model=1): 205, ProcessCoord(pipe=0, data=103, model=0): 206, Process + 0: Coord(pipe=0, data=103, model=1): 207, ProcessCoord(pipe=0, data=104, model=0): 208, ProcessCoord(pipe=0, data=104, model=1): 209, ProcessCoord(pipe=0, data=105, model=0): 210, ProcessCoord(pipe=0, data=105, model=1): 211, ProcessCoord(pipe=0, data=106, model=0): 212, ProcessCoord(pipe=0, data=106, model=1): 213, ProcessCoord(pipe=0, data=107, model=0): 214, ProcessCoord(pipe=0, data=107, model=1): 215, ProcessCoord(pipe=0, data=108, model=0): 216, ProcessCoord(pipe=0, data=108, model=1): 217, ProcessCoord(pipe=0, data=109, model=0): 218, ProcessCoord(pipe=0, data=109, model=1): 219, ProcessCoord(pipe=0, data=110, model=0): 220, ProcessCoord(pipe=0, data=110, model=1): 221, ProcessCoord(pipe=0, data=111, model=0): 222, ProcessCoord(pipe=0, data=111, model=1): 223, ProcessCoord(pipe=0, data=112, model=0): 224, ProcessCoord(pipe=0, data=112, model=1): 225, ProcessCoord(pipe=0, data=113, model=0): 226, ProcessCoord(pipe=0, data=113, model=1): 227, ProcessCoord(pipe=0, data=114, model=0): 228, ProcessCoord(pipe=0 + 0: , data=114, model=1): 229, ProcessCoord(pipe=0, data=115, model=0): 230, ProcessCoord(pipe=0, data=115, model=1): 231, ProcessCoord(pipe=0, data=116, model=0): 232, ProcessCoord(pipe=0, data=116, model=1): 233, ProcessCoord(pipe=0, data=117, model=0): 234, ProcessCoord(pipe=0, data=117, model=1): 235, ProcessCoord(pipe=0, data=118, model=0): 236, ProcessCoord(pipe=0, data=118, model=1): 237, ProcessCoord(pipe=0, data=119, model=0): 238, ProcessCoord(pipe=0, data=119, model=1): 239, ProcessCoord(pipe=0, data=120, model=0): 240, ProcessCoord(pipe=0, data=120, model=1): 241, ProcessCoord(pipe=0, data=121, model=0): 242, ProcessCoord(pipe=0, data=121, model=1): 243, ProcessCoord(pipe=0, data=122, model=0): 244, ProcessCoord(pipe=0, data=122, model=1): 245, ProcessCoord(pipe=0, data=123, model=0): 246, ProcessCoord(pipe=0, data=123, model=1): 247, ProcessCoord(pipe=0, data=124, model=0): 248, ProcessCoord(pipe=0, data=124, model=1): 249, ProcessCoord(pipe=0, data=125, model=0): 250, ProcessCoord(pipe=0, data=125, + 0: model=1): 251, ProcessCoord(pipe=0, data=126, model=0): 252, ProcessCoord(pipe=0, data=126, model=1): 253, ProcessCoord(pipe=0, data=127, model=0): 254, ProcessCoord(pipe=0, data=127, model=1): 255, ProcessCoord(pipe=1, data=0, model=0): 256, ProcessCoord(pipe=1, data=0, model=1): 257, ProcessCoord(pipe=1, data=1, model=0): 258, ProcessCoord(pipe=1, data=1, model=1): 259, ProcessCoord(pipe=1, data=2, model=0): 260, ProcessCoord(pipe=1, data=2, model=1): 261, ProcessCoord(pipe=1, data=3, model=0): 262, ProcessCoord(pipe=1, data=3, model=1): 263, ProcessCoord(pipe=1, data=4, model=0): 264, ProcessCoord(pipe=1, data=4, model=1): 265, ProcessCoord(pipe=1, data=5, model=0): 266, ProcessCoord(pipe=1, data=5, model=1): 267, ProcessCoord(pipe=1, data=6, model=0): 268, ProcessCoord(pipe=1, data=6, model=1): 269, ProcessCoord(pipe=1, data=7, model=0): 270, ProcessCoord(pipe=1, data=7, model=1): 271, ProcessCoord(pipe=1, data=8, model=0): 272, ProcessCoord(pipe=1, data=8, model=1): 273, ProcessCoord(pipe=1, data=9, mode + 0: l=0): 274, ProcessCoord(pipe=1, data=9, model=1): 275, ProcessCoord(pipe=1, data=10, model=0): 276, ProcessCoord(pipe=1, data=10, model=1): 277, ProcessCoord(pipe=1, data=11, model=0): 278, ProcessCoord(pipe=1, data=11, model=1): 279, ProcessCoord(pipe=1, data=12, model=0): 280, ProcessCoord(pipe=1, data=12, model=1): 281, ProcessCoord(pipe=1, data=13, model=0): 282, ProcessCoord(pipe=1, data=13, model=1): 283, ProcessCoord(pipe=1, data=14, model=0): 284, ProcessCoord(pipe=1, data=14, model=1): 285, ProcessCoord(pipe=1, data=15, model=0): 286, ProcessCoord(pipe=1, data=15, model=1): 287, ProcessCoord(pipe=1, data=16, model=0): 288, ProcessCoord(pipe=1, data=16, model=1): 289, ProcessCoord(pipe=1, data=17, model=0): 290, ProcessCoord(pipe=1, data=17, model=1): 291, ProcessCoord(pipe=1, data=18, model=0): 292, ProcessCoord(pipe=1, data=18, model=1): 293, ProcessCoord(pipe=1, data=19, model=0): 294, ProcessCoord(pipe=1, data=19, model=1): 295, ProcessCoord(pipe=1, data=20, model=0): 296, ProcessCoord(pipe=1, dat + 0: a=20, model=1): 297, ProcessCoord(pipe=1, data=21, model=0): 298, ProcessCoord(pipe=1, data=21, model=1): 299, ProcessCoord(pipe=1, data=22, model=0): 300, ProcessCoord(pipe=1, data=22, model=1): 301, ProcessCoord(pipe=1, data=23, model=0): 302, ProcessCoord(pipe=1, data=23, model=1): 303, ProcessCoord(pipe=1, data=24, model=0): 304, ProcessCoord(pipe=1, data=24, model=1): 305, ProcessCoord(pipe=1, data=25, model=0): 306, ProcessCoord(pipe=1, data=25, model=1): 307, ProcessCoord(pipe=1, data=26, model=0): 308, ProcessCoord(pipe=1, data=26, model=1): 309, ProcessCoord(pipe=1, data=27, model=0): 310, ProcessCoord(pipe=1, data=27, model=1): 311, ProcessCoord(pipe=1, data=28, model=0): 312, ProcessCoord(pipe=1, data=28, model=1): 313, ProcessCoord(pipe=1, data=29, model=0): 314, ProcessCoord(pipe=1, data=29, model=1): 315, ProcessCoord(pipe=1, data=30, model=0): 316, ProcessCoord(pipe=1, data=30, model=1): 317, ProcessCoord(pipe=1, data=31, model=0): 318, ProcessCoord(pipe=1, data=31, model=1): 319, ProcessCoord( + 0: pipe=1, data=32, model=0): 320, ProcessCoord(pipe=1, data=32, model=1): 321, ProcessCoord(pipe=1, data=33, model=0): 322, ProcessCoord(pipe=1, data=33, model=1): 323, ProcessCoord(pipe=1, data=34, model=0): 324, ProcessCoord(pipe=1, data=34, model=1): 325, ProcessCoord(pipe=1, data=35, model=0): 326, ProcessCoord(pipe=1, data=35, model=1): 327, ProcessCoord(pipe=1, data=36, model=0): 328, ProcessCoord(pipe=1, data=36, model=1): 329, ProcessCoord(pipe=1, data=37, model=0): 330, ProcessCoord(pipe=1, data=37, model=1): 331, ProcessCoord(pipe=1, data=38, model=0): 332, ProcessCoord(pipe=1, data=38, model=1): 333, ProcessCoord(pipe=1, data=39, model=0): 334, ProcessCoord(pipe=1, data=39, model=1): 335, ProcessCoord(pipe=1, data=40, model=0): 336, ProcessCoord(pipe=1, data=40, model=1): 337, ProcessCoord(pipe=1, data=41, model=0): 338, ProcessCoord(pipe=1, data=41, model=1): 339, ProcessCoord(pipe=1, data=42, model=0): 340, ProcessCoord(pipe=1, data=42, model=1): 341, ProcessCoord(pipe=1, data=43, model=0): 342, Pr + 0: ocessCoord(pipe=1, data=43, model=1): 343, ProcessCoord(pipe=1, data=44, model=0): 344, ProcessCoord(pipe=1, data=44, model=1): 345, ProcessCoord(pipe=1, data=45, model=0): 346, ProcessCoord(pipe=1, data=45, model=1): 347, ProcessCoord(pipe=1, data=46, model=0): 348, ProcessCoord(pipe=1, data=46, model=1): 349, ProcessCoord(pipe=1, data=47, model=0): 350, ProcessCoord(pipe=1, data=47, model=1): 351, ProcessCoord(pipe=1, data=48, model=0): 352, ProcessCoord(pipe=1, data=48, model=1): 353, ProcessCoord(pipe=1, data=49, model=0): 354, ProcessCoord(pipe=1, data=49, model=1): 355, ProcessCoord(pipe=1, data=50, model=0): 356, ProcessCoord(pipe=1, data=50, model=1): 357, ProcessCoord(pipe=1, data=51, model=0): 358, ProcessCoord(pipe=1, data=51, model=1): 359, ProcessCoord(pipe=1, data=52, model=0): 360, ProcessCoord(pipe=1, data=52, model=1): 361, ProcessCoord(pipe=1, data=53, model=0): 362, ProcessCoord(pipe=1, data=53, model=1): 363, ProcessCoord(pipe=1, data=54, model=0): 364, ProcessCoord(pipe=1, data=54, model= + 0: 1): 365, ProcessCoord(pipe=1, data=55, model=0): 366, ProcessCoord(pipe=1, data=55, model=1): 367, ProcessCoord(pipe=1, data=56, model=0): 368, ProcessCoord(pipe=1, data=56, model=1): 369, ProcessCoord(pipe=1, data=57, model=0): 370, ProcessCoord(pipe=1, data=57, model=1): 371, ProcessCoord(pipe=1, data=58, model=0): 372, ProcessCoord(pipe=1, data=58, model=1): 373, ProcessCoord(pipe=1, data=59, model=0): 374, ProcessCoord(pipe=1, data=59, model=1): 375, ProcessCoord(pipe=1, data=60, model=0): 376, ProcessCoord(pipe=1, data=60, model=1): 377, ProcessCoord(pipe=1, data=61, model=0): 378, ProcessCoord(pipe=1, data=61, model=1): 379, ProcessCoord(pipe=1, data=62, model=0): 380, ProcessCoord(pipe=1, data=62, model=1): 381, ProcessCoord(pipe=1, data=63, model=0): 382, ProcessCoord(pipe=1, data=63, model=1): 383, ProcessCoord(pipe=1, data=64, model=0): 384, ProcessCoord(pipe=1, data=64, model=1): 385, ProcessCoord(pipe=1, data=65, model=0): 386, ProcessCoord(pipe=1, data=65, model=1): 387, ProcessCoord(pipe=1, data + 0: =66, model=0): 388, ProcessCoord(pipe=1, data=66, model=1): 389, ProcessCoord(pipe=1, data=67, model=0): 390, ProcessCoord(pipe=1, data=67, model=1): 391, ProcessCoord(pipe=1, data=68, model=0): 392, ProcessCoord(pipe=1, data=68, model=1): 393, ProcessCoord(pipe=1, data=69, model=0): 394, ProcessCoord(pipe=1, data=69, model=1): 395, ProcessCoord(pipe=1, data=70, model=0): 396, ProcessCoord(pipe=1, data=70, model=1): 397, ProcessCoord(pipe=1, data=71, model=0): 398, ProcessCoord(pipe=1, data=71, model=1): 399, ProcessCoord(pipe=1, data=72, model=0): 400, ProcessCoord(pipe=1, data=72, model=1): 401, ProcessCoord(pipe=1, data=73, model=0): 402, ProcessCoord(pipe=1, data=73, model=1): 403, ProcessCoord(pipe=1, data=74, model=0): 404, ProcessCoord(pipe=1, data=74, model=1): 405, ProcessCoord(pipe=1, data=75, model=0): 406, ProcessCoord(pipe=1, data=75, model=1): 407, ProcessCoord(pipe=1, data=76, model=0): 408, ProcessCoord(pipe=1, data=76, model=1): 409, ProcessCoord(pipe=1, data=77, model=0): 410, ProcessCoord(p + 0: ipe=1, data=77, model=1): 411, ProcessCoord(pipe=1, data=78, model=0): 412, ProcessCoord(pipe=1, data=78, model=1): 413, ProcessCoord(pipe=1, data=79, model=0): 414, ProcessCoord(pipe=1, data=79, model=1): 415, ProcessCoord(pipe=1, data=80, model=0): 416, ProcessCoord(pipe=1, data=80, model=1): 417, ProcessCoord(pipe=1, data=81, model=0): 418, ProcessCoord(pipe=1, data=81, model=1): 419, ProcessCoord(pipe=1, data=82, model=0): 420, ProcessCoord(pipe=1, data=82, model=1): 421, ProcessCoord(pipe=1, data=83, model=0): 422, ProcessCoord(pipe=1, data=83, model=1): 423, ProcessCoord(pipe=1, data=84, model=0): 424, ProcessCoord(pipe=1, data=84, model=1): 425, ProcessCoord(pipe=1, data=85, model=0): 426, ProcessCoord(pipe=1, data=85, model=1): 427, ProcessCoord(pipe=1, data=86, model=0): 428, ProcessCoord(pipe=1, data=86, model=1): 429, ProcessCoord(pipe=1, data=87, model=0): 430, ProcessCoord(pipe=1, data=87, model=1): 431, ProcessCoord(pipe=1, data=88, model=0): 432, ProcessCoord(pipe=1, data=88, model=1): 433, Pro + 0: cessCoord(pipe=1, data=89, model=0): 434, ProcessCoord(pipe=1, data=89, model=1): 435, ProcessCoord(pipe=1, data=90, model=0): 436, ProcessCoord(pipe=1, data=90, model=1): 437, ProcessCoord(pipe=1, data=91, model=0): 438, ProcessCoord(pipe=1, data=91, model=1): 439, ProcessCoord(pipe=1, data=92, model=0): 440, ProcessCoord(pipe=1, data=92, model=1): 441, ProcessCoord(pipe=1, data=93, model=0): 442, ProcessCoord(pipe=1, data=93, model=1): 443, ProcessCoord(pipe=1, data=94, model=0): 444, ProcessCoord(pipe=1, data=94, model=1): 445, ProcessCoord(pipe=1, data=95, model=0): 446, ProcessCoord(pipe=1, data=95, model=1): 447, ProcessCoord(pipe=1, data=96, model=0): 448, ProcessCoord(pipe=1, data=96, model=1): 449, ProcessCoord(pipe=1, data=97, model=0): 450, ProcessCoord(pipe=1, data=97, model=1): 451, ProcessCoord(pipe=1, data=98, model=0): 452, ProcessCoord(pipe=1, data=98, model=1): 453, ProcessCoord(pipe=1, data=99, model=0): 454, ProcessCoord(pipe=1, data=99, model=1): 455, ProcessCoord(pipe=1, data=100, model= + 0: 0): 456, ProcessCoord(pipe=1, data=100, model=1): 457, ProcessCoord(pipe=1, data=101, model=0): 458, ProcessCoord(pipe=1, data=101, model=1): 459, ProcessCoord(pipe=1, data=102, model=0): 460, ProcessCoord(pipe=1, data=102, model=1): 461, ProcessCoord(pipe=1, data=103, model=0): 462, ProcessCoord(pipe=1, data=103, model=1): 463, ProcessCoord(pipe=1, data=104, model=0): 464, ProcessCoord(pipe=1, data=104, model=1): 465, ProcessCoord(pipe=1, data=105, model=0): 466, ProcessCoord(pipe=1, data=105, model=1): 467, ProcessCoord(pipe=1, data=106, model=0): 468, ProcessCoord(pipe=1, data=106, model=1): 469, ProcessCoord(pipe=1, data=107, model=0): 470, ProcessCoord(pipe=1, data=107, model=1): 471, ProcessCoord(pipe=1, data=108, model=0): 472, ProcessCoord(pipe=1, data=108, model=1): 473, ProcessCoord(pipe=1, data=109, model=0): 474, ProcessCoord(pipe=1, data=109, model=1): 475, ProcessCoord(pipe=1, data=110, model=0): 476, ProcessCoord(pipe=1, data=110, model=1): 477, ProcessCoord(pipe=1, data=111, model=0): 478, Pro + 0: cessCoord(pipe=1, data=111, model=1): 479, ProcessCoord(pipe=1, data=112, model=0): 480, ProcessCoord(pipe=1, data=112, model=1): 481, ProcessCoord(pipe=1, data=113, model=0): 482, ProcessCoord(pipe=1, data=113, model=1): 483, ProcessCoord(pipe=1, data=114, model=0): 484, ProcessCoord(pipe=1, data=114, model=1): 485, ProcessCoord(pipe=1, data=115, model=0): 486, ProcessCoord(pipe=1, data=115, model=1): 487, ProcessCoord(pipe=1, data=116, model=0): 488, ProcessCoord(pipe=1, data=116, model=1): 489, ProcessCoord(pipe=1, data=117, model=0): 490, ProcessCoord(pipe=1, data=117, model=1): 491, ProcessCoord(pipe=1, data=118, model=0): 492, ProcessCoord(pipe=1, data=118, model=1): 493, ProcessCoord(pipe=1, data=119, model=0): 494, ProcessCoord(pipe=1, data=119, model=1): 495, ProcessCoord(pipe=1, data=120, model=0): 496, ProcessCoord(pipe=1, data=120, model=1): 497, ProcessCoord(pipe=1, data=121, model=0): 498, ProcessCoord(pipe=1, data=121, model=1): 499, ProcessCoord(pipe=1, data=122, model=0): 500, ProcessCoord(pi + 0: pe=1, data=122, model=1): 501, ProcessCoord(pipe=1, data=123, model=0): 502, ProcessCoord(pipe=1, data=123, model=1): 503, ProcessCoord(pipe=1, data=124, model=0): 504, ProcessCoord(pipe=1, data=124, model=1): 505, ProcessCoord(pipe=1, data=125, model=0): 506, ProcessCoord(pipe=1, data=125, model=1): 507, ProcessCoord(pipe=1, data=126, model=0): 508, ProcessCoord(pipe=1, data=126, model=1): 509, ProcessCoord(pipe=1, data=127, model=0): 510, ProcessCoord(pipe=1, data=127, model=1): 511} + 0: [2023-04-29 11:26:26,003] [INFO] [module.py:366:_partition_layers] Partitioning pipeline stages with method type:transformer + 0: stage=0 layers=24 + 0: 0: _to_float16 + 0: 1: EmbeddingPipe + 0: 2: + 0: 3: ParallelTransformerLayerPipe + 0: 4: ParallelTransformerLayerPipe + 0: 5: ParallelTransformerLayerPipe + 0: 6: ParallelTransformerLayerPipe + 0: 7: ParallelTransformerLayerPipe + 0: 8: ParallelTransformerLayerPipe + 0: 9: ParallelTransformerLayerPipe + 0: 10: ParallelTransformerLayerPipe + 0: 11: ParallelTransformerLayerPipe + 0: 12: ParallelTransformerLayerPipe + 0: 13: ParallelTransformerLayerPipe + 0: 14: ParallelTransformerLayerPipe + 0: 15: ParallelTransformerLayerPipe + 0: 16: ParallelTransformerLayerPipe + 0: 17: ParallelTransformerLayerPipe + 0: 18: ParallelTransformerLayerPipe + 0: 19: ParallelTransformerLayerPipe + 0: 20: ParallelTransformerLayerPipe + 0: 21: ParallelTransformerLayerPipe + 0: 22: ParallelTransformerLayerPipe + 0: 23: ParallelTransformerLayerPipe + 0: stage=1 layers=25 + 0: 24: ParallelTransformerLayerPipe + 0: 25: ParallelTransformerLayerPipe + 0: 26: ParallelTransformerLayerPipe + 0: 27: ParallelTransformerLayerPipe + 0: 28: ParallelTransformerLayerPipe + 0: 29: ParallelTransformerLayerPipe + 0: 30: ParallelTransformerLayerPipe + 0: 31: ParallelTransformerLayerPipe + 0: 32: ParallelTransformerLayerPipe + 0: 33: ParallelTransformerLayerPipe + 0: 34: ParallelTransformerLayerPipe + 0: 35: ParallelTransformerLayerPipe + 0: 36: ParallelTransformerLayerPipe + 0: 37: ParallelTransformerLayerPipe + 0: 38: ParallelTransformerLayerPipe + 0: 39: ParallelTransformerLayerPipe + 0: 40: ParallelTransformerLayerPipe + 0: 41: ParallelTransformerLayerPipe + 0: 42: ParallelTransformerLayerPipe + 0: 43: ParallelTransformerLayerPipe + 0: 44: ParallelTransformerLayerPipe + 0: 45: undo + 0: 46: MixedFusedLayerNorm + 0: 47: EmbeddingPipe + 0: 48: float16_to_fp32 + 0: loss: CrossEntropy + 0: [2023-04-29 11:26:30,084] [INFO] [utils.py:827:see_memory_usage] After Building Model + 0: [2023-04-29 11:26:30,085] [INFO] [utils.py:828:see_memory_usage] MA 4.16 GB Max_MA 4.16 GB CA 4.17 GB Max_CA 4 GB + 0: [2023-04-29 11:26:30,085] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 39.18 GB, percent = 7.8% + 0: setting training iterations to 0 + 0: > learning rate decay style: cosine + 0: DeepSpeed is enabled. + 0: [2023-04-29 11:26:30,087] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed info: version=0.7.5, git-hash=unknown, git-branch=unknown + 0: [2023-04-29 11:26:34,491] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed Flops Profiler Enabled: False + 0: [2023-04-29 11:26:34,491] [INFO] [logging.py:68:log_dist] [Rank 0] Removing param_group that has no 'params' in the client Optimizer + 0: [2023-04-29 11:26:34,491] [INFO] [logging.py:68:log_dist] [Rank 0] Using client Optimizer as basic optimizer + 0: [2023-04-29 11:26:34,500] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed Basic Optimizer = FusedAdam + 0: [2023-04-29 11:26:34,500] [INFO] [logging.py:68:log_dist] [Rank 0] Creating BF16 optimizer + 0: [2023-04-29 11:26:34,640] [INFO] [utils.py:827:see_memory_usage] begin bf16_optimizer + 0: [2023-04-29 11:26:34,640] [INFO] [utils.py:828:see_memory_usage] MA 4.15 GB Max_MA 4.18 GB CA 4.18 GB Max_CA 4 GB + 0: [2023-04-29 11:26:34,641] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 39.8 GB, percent = 7.9% + 0: ninja: no work to do. + 0: Time to load utils op: 0.1796567440032959 seconds +32: Time to load utils op: 0.11121702194213867 seconds +32: Time to load utils op: 0.10224366188049316 seconds +32: Time to load utils op: 0.10191917419433594 seconds +32: Time to load utils op: 0.10198116302490234 seconds + 0: Time to load utils op: 0.20494723320007324 seconds + 0: Time to load utils op: 0.2044064998626709 seconds + 0: Time to load utils op: 0.10336589813232422 seconds +33: Time to load utils op: 0.1124734878540039 secondsTime to load utils op: 0.11177778244018555 secondsTime to load utils op: 0.11172270774841309 seconds +33: +33: +33: Time to load utils op: 0.11175751686096191 seconds + 2: Time to load utils op: 0.2117912769317627 seconds + 2: Time to load utils op: 0.21182012557983398 seconds + 2: Time to load utils op: 0.2120213508605957 secondsTime to load utils op: 0.21200227737426758 seconds + 2: + 5: Time to load utils op: 0.21182656288146973 secondsTime to load utils op: 0.2117304801940918 seconds + 5: + 5: Time to load utils op: 0.21178269386291504 secondsTime to load utils op: 0.2113513946533203 seconds + 5: + 6: Time to load utils op: 0.21216320991516113 secondsTime to load utils op: 0.2121596336364746 secondsTime to load utils op: 0.21181797981262207 seconds + 6: + 6: + 6: Time to load utils op: 0.21151447296142578 seconds + 8: Time to load utils op: 0.21045494079589844 secondsTime to load utils op: 0.21068096160888672 secondsTime to load utils op: 0.2104511260986328 secondsTime to load utils op: 0.21089816093444824 seconds + 8: + 8: + 8: +10: Time to load utils op: 0.21154212951660156 secondsTime to load utils op: 0.21170711517333984 seconds +10: +10: Time to load utils op: 0.21117138862609863 secondsTime to load utils op: 0.21091318130493164 seconds +10: +36: Time to load utils op: 0.11569523811340332 secondsTime to load utils op: 0.11541223526000977 secondsTime to load utils op: 0.11571955680847168 seconds +36: +36: +36: Time to load utils op: 0.11548924446105957 seconds +35: Time to load utils op: 0.11336135864257812 secondsTime to load utils op: 0.11334729194641113 secondsTime to load utils op: 0.11336731910705566 secondsTime to load utils op: 0.11336374282836914 seconds +35: +35: +35: +34: Time to load utils op: 0.1150672435760498 secondsTime to load utils op: 0.1150660514831543 secondsTime to load utils op: 0.11507153511047363 seconds +34: +34: +34: Time to load utils op: 0.11507916450500488 seconds + 4: Time to load utils op: 0.21120572090148926 seconds + 4: Time to load utils op: 0.21120619773864746 seconds + 4: Time to load utils op: 0.21120858192443848 seconds + 4: Time to load utils op: 0.21112942695617676 seconds + 7: Time to load utils op: 0.21231293678283691 secondsTime to load utils op: 0.21232128143310547 secondsTime to load utils op: 0.21231961250305176 seconds + 7: + 7: + 7: Time to load utils op: 0.2123270034790039 seconds +44: Time to load utils op: 0.11675500869750977 secondsTime to load utils op: 0.11697196960449219 secondsTime to load utils op: 0.11702394485473633 secondsTime to load utils op: 0.11697578430175781 seconds +44: +44: +44: +40: Time to load utils op: 0.11626029014587402 secondsTime to load utils op: 0.11626172065734863 secondsTime to load utils op: 0.11626219749450684 seconds +40: +40: +40: Time to load utils op: 0.11618947982788086 seconds + 9: Time to load utils op: 0.21276283264160156 seconds + 9: Time to load utils op: 0.2127687931060791 seconds + 9: Time to load utils op: 0.21277070045471191 secondsTime to load utils op: 0.21277594566345215 seconds + 9: + 1: Time to load utils op: 0.21506667137145996 secondsTime to load utils op: 0.21506834030151367 secondsTime to load utils op: 0.215073823928833 seconds + 1: + 1: + 1: Time to load utils op: 0.21505475044250488 seconds +41: Time to load utils op: 0.11639690399169922 secondsTime to load utils op: 0.11639142036437988 secondsTime to load utils op: 0.11638927459716797 secondsTime to load utils op: 0.11624908447265625 seconds +41: +41: +41: +37: Time to load utils op: 0.11829185485839844 seconds +37: Time to load utils op: 0.11830401420593262 secondsTime to load utils op: 0.11831068992614746 seconds +37: +37: Time to load utils op: 0.11827468872070312 seconds +39: Time to load utils op: 0.11857318878173828 secondsTime to load utils op: 0.11858940124511719 seconds +39: +39: Time to load utils op: 0.11857485771179199 seconds +39: Time to load utils op: 0.11858415603637695 seconds + 3: Time to load utils op: 0.21513152122497559 secondsTime to load utils op: 0.20988225936889648 secondsTime to load utils op: 0.21443939208984375 seconds + 3: + 3: Time to load utils op: 0.21407151222229004 seconds + 3: +11: Time to load utils op: 0.21531248092651367 secondsTime to load utils op: 0.2153186798095703 secondsTime to load utils op: 0.21532702445983887 secondsTime to load utils op: 0.21532320976257324 seconds +11: +11: +11: +12: Time to load utils op: 0.2152564525604248 secondsTime to load utils op: 0.2152550220489502 seconds +12: +12: Time to load utils op: 0.215256929397583 secondsTime to load utils op: 0.2152552604675293 seconds +12: +15: Time to load utils op: 0.21504545211791992 secondsTime to load utils op: 0.21504616737365723 secondsTime to load utils op: 0.21504688262939453 seconds +15: Time to load utils op: 0.21504688262939453 seconds +15: +15: +42: Time to load utils op: 0.11951875686645508 secondsTime to load utils op: 0.1195213794708252 secondsTime to load utils op: 0.11952447891235352 seconds +42: +42: +42: Time to load utils op: 0.11952733993530273 seconds +38: Time to load utils op: 0.12091422080993652 secondsTime to load utils op: 0.12092161178588867 seconds +38: +38: Time to load utils op: 0.12092065811157227 seconds +38: Time to load utils op: 0.12093162536621094 seconds +16: Time to load utils op: 0.21546053886413574 secondsTime to load utils op: 0.2154674530029297 seconds +16: +16: Time to load utils op: 0.21535396575927734 seconds +16: Time to load utils op: 0.21547293663024902 seconds +13: Time to load utils op: 0.21621108055114746 secondsTime to load utils op: 0.21621394157409668 secondsTime to load utils op: 0.2162163257598877 secondsTime to load utils op: 0.21621012687683105 seconds +13: +13: +13: +26: Time to load utils op: 0.2169492244720459 secondsTime to load utils op: 0.21644377708435059 secondsTime to load utils op: 0.216994047164917 seconds +26: Time to load utils op: 0.2174382209777832 seconds +26: +26: +29: Time to load utils op: 0.21681642532348633 secondsTime to load utils op: 0.21633243560791016 secondsTime to load utils op: 0.21600031852722168 secondsTime to load utils op: 0.21597647666931152 seconds +29: +29: +29: +43: Time to load utils op: 0.12202000617980957 secondsTime to load utils op: 0.12202191352844238 seconds +43: +43: Time to load utils op: 0.12202835083007812 secondsTime to load utils op: 0.12202692031860352 seconds +43: +53: Time to load utils op: 0.12251853942871094 secondsTime to load utils op: 0.1233062744140625 secondsTime to load utils op: 0.12235641479492188 secondsTime to load utils op: 0.1235506534576416 seconds +53: +53: +53: +28: Time to load utils op: 0.21318364143371582 secondsTime to load utils op: 0.21318578720092773 seconds +28: +28: Time to load utils op: 0.21319365501403809 seconds +28: Time to load utils op: 0.21319580078125 seconds +14: Time to load utils op: 0.21973204612731934 secondsTime to load utils op: 0.21958470344543457 secondsTime to load utils op: 0.21973228454589844 secondsTime to load utils op: 0.21972990036010742 seconds +14: +14: +14: +21: Time to load utils op: 0.2166738510131836 secondsTime to load utils op: 0.21665740013122559 secondsTime to load utils op: 0.2166767120361328 secondsTime to load utils op: 0.21667242050170898 seconds +21: +21: +21: +18: Time to load utils op: 0.21840310096740723 secondsTime to load utils op: 0.2183840274810791 secondsTime to load utils op: 0.21840953826904297 seconds +18: +18: +18: Time to load utils op: 0.2184131145477295 seconds +23: Time to load utils op: 0.21552824974060059 secondsTime to load utils op: 0.2155284881591797 seconds +23: +23: Time to load utils op: 0.21551799774169922 secondsTime to load utils op: 0.2155303955078125 seconds +23: +17: Time to load utils op: 0.21668672561645508 secondsTime to load utils op: 0.21669483184814453 secondsTime to load utils op: 0.21669316291809082 seconds +17: +17: Time to load utils op: 0.2167072296142578 seconds +17: +45: Time to load utils op: 0.12360310554504395 secondsTime to load utils op: 0.12360692024230957 seconds +45: +45: Time to load utils op: 0.1236124038696289 secondsTime to load utils op: 0.12361550331115723 seconds +45: +27: Time to load utils op: 0.2135629653930664 secondsTime to load utils op: 0.21356534957885742 seconds +27: +27: Time to load utils op: 0.21356654167175293 seconds +27: Time to load utils op: 0.21354985237121582 seconds +22: Time to load utils op: 0.21715235710144043 secondsTime to load utils op: 0.2171475887298584 seconds +22: +22: Time to load utils op: 0.21715021133422852 seconds +22: Time to load utils op: 0.21715402603149414 seconds +30: Time to load utils op: 0.21368908882141113 secondsTime to load utils op: 0.2136838436126709 secondsTime to load utils op: 0.21369171142578125 seconds +30: +30: +30: Time to load utils op: 0.2136976718902588 seconds +31: Time to load utils op: 0.21332693099975586 secondsTime to load utils op: 0.21332502365112305 secondsTime to load utils op: 0.2133312225341797 seconds +31: +31: +31: Time to load utils op: 0.21332740783691406 seconds +24: Time to load utils op: 0.21549201011657715 secondsTime to load utils op: 0.21549296379089355 secondsTime to load utils op: 0.21549296379089355 secondsTime to load utils op: 0.21548986434936523 seconds +24: +24: +24: +20: Time to load utils op: 0.2189333438873291 seconds +20: Time to load utils op: 0.21894454956054688 secondsTime to load utils op: 0.2189493179321289 seconds +20: Time to load utils op: 0.21893954277038574 seconds +20: +19: Time to load utils op: 0.2197132110595703 secondsTime to load utils op: 0.2197132110595703 secondsTime to load utils op: 0.21971678733825684 seconds +19: +19: +19: Time to load utils op: 0.2197251319885254 seconds +47: Time to load utils op: 0.12522029876708984 secondsTime to load utils op: 0.12522053718566895 secondsTime to load utils op: 0.12522220611572266 seconds +47: +47: +47: Time to load utils op: 0.1252303123474121 seconds +25: Time to load utils op: 0.21711039543151855 secondsTime to load utils op: 0.21702837944030762 seconds +25: +25: Time to load utils op: 0.21712064743041992 secondsTime to load utils op: 0.21711516380310059 seconds +25: +56: Time to load utils op: 0.12531256675720215 secondsTime to load utils op: 0.1250455379486084 secondsTime to load utils op: 0.12381672859191895 secondsTime to load utils op: 0.1238706111907959 seconds +56: +56: +56: +57: Time to load utils op: 0.12793540954589844 secondsTime to load utils op: 0.12781190872192383 seconds +57: +57: Time to load utils op: 0.12757349014282227 seconds +57: Time to load utils op: 0.12796902656555176 seconds +54: Time to load utils op: 0.12355661392211914 secondsTime to load utils op: 0.12356400489807129 seconds +54: Time to load utils op: 0.12339997291564941 seconds +54: +54: Time to load utils op: 0.12355709075927734 seconds +46: Time to load utils op: 0.1266477108001709 seconds +46: Time to load utils op: 0.1266491413116455 secondsTime to load utils op: 0.12665081024169922 secondsTime to load utils op: 0.12664389610290527 seconds +46: +46: +48: Time to load utils op: 0.12511849403381348 secondsTime to load utils op: 0.12531781196594238 seconds +48: +48: Time to load utils op: 0.12532472610473633 secondsTime to load utils op: 0.12531709671020508 seconds +48: +52: Time to load utils op: 0.12439513206481934 secondsTime to load utils op: 0.1240091323852539 secondsTime to load utils op: 0.12439918518066406 seconds +52: +52: Time to load utils op: 0.12440371513366699 seconds +52: +55: Time to load utils op: 0.12278056144714355 secondsTime to load utils op: 0.12278294563293457 secondsTime to load utils op: 0.12278532981872559 seconds +55: +55: +55: Time to load utils op: 0.12266016006469727 seconds +49: Time to load utils op: 0.12415266036987305 secondsTime to load utils op: 0.12415385246276855 seconds +49: +49: Time to load utils op: 0.1241612434387207 seconds +49: Time to load utils op: 0.12390875816345215 seconds +51: Time to load utils op: 0.12477254867553711 secondsTime to load utils op: 0.12476778030395508 secondsTime to load utils op: 0.12476992607116699 seconds +51: +51: +51: Time to load utils op: 0.12476801872253418 seconds +61: Time to load utils op: 0.12140250205993652 secondsTime to load utils op: 0.12136292457580566 seconds +61: +61: Time to load utils op: 0.12142372131347656 secondsTime to load utils op: 0.12142825126647949 seconds +61: +63: Time to load utils op: 0.11993122100830078 secondsTime to load utils op: 0.1199336051940918 secondsTime to load utils op: 0.11993551254272461 secondsTime to load utils op: 0.1199331283569336 seconds +63: +63: +63: +60: Time to load utils op: 0.11957621574401855 seconds +60: Time to load utils op: 0.11957621574401855 secondsTime to load utils op: 0.11958527565002441 seconds +60: +60: Time to load utils op: 0.11959433555603027 seconds +50: Time to load utils op: 0.12274408340454102 secondsTime to load utils op: 0.12274169921875 seconds +50: +50: Time to load utils op: 0.12276554107666016 secondsTime to load utils op: 0.12275195121765137 seconds +50: +59: Time to load utils op: 0.12237215042114258 secondsTime to load utils op: 0.1222074031829834 secondsTime to load utils op: 0.12238168716430664 seconds +59: +59: +59: Time to load utils op: 0.12238740921020508 seconds +58: Time to load utils op: 0.12341475486755371 secondsTime to load utils op: 0.12341952323913574 secondsTime to load utils op: 0.12342095375061035 secondsTime to load utils op: 0.12342143058776855 seconds +58: +58: +58: +62: Time to load utils op: 0.12046027183532715 secondsTime to load utils op: 0.1204535961151123 secondsTime to load utils op: 0.1204688549041748 seconds +62: +62: Time to load utils op: 0.12041783332824707 seconds +62: + 0: Time to load utils op: 0.0007140636444091797 seconds + 0: Time to load utils op: 0.0007331371307373047 seconds + 0: Time to load utils op: 0.0006430149078369141 seconds +33: Time to load utils op: 0.0010361671447753906 seconds +33: Time to load utils op: 0.0010216236114501953 seconds +33: Time to load utils op: 0.0009095668792724609 seconds +33: Time to load utils op: 0.0010607242584228516 seconds + 6: Time to load utils op: 0.0008184909820556641 seconds + 6: Time to load utils op: 0.0009317398071289062 secondsTime to load utils op: 0.0009179115295410156 seconds + 6: + 6: Time to load utils op: 0.0008990764617919922 seconds +43: Time to load utils op: 0.0007839202880859375 seconds +43: Time to load utils op: 0.0008378028869628906 seconds +43: Time to load utils op: 0.000823974609375 seconds +43: Time to load utils op: 0.0008723735809326172 seconds + 5: Time to load utils op: 0.0008726119995117188 seconds + 5: Time to load utils op: 0.0008985996246337891 seconds + 5: Time to load utils op: 0.0009407997131347656 seconds +32: Time to load utils op: 0.0005490779876708984 seconds +32: Time to load utils op: 0.0005481243133544922 seconds +32: Time to load utils op: 0.0005743503570556641 seconds +32: Time to load utils op: 0.0005555152893066406 seconds + 5: Time to load utils op: 0.0009257793426513672 seconds + 8: Time to load utils op: 0.000926971435546875 seconds + 8: Time to load utils op: 0.0009174346923828125 seconds + 8: Time to load utils op: 0.0009093284606933594 seconds + 8: Time to load utils op: 0.0009775161743164062 seconds +56: Time to load utils op: 0.0006914138793945312 seconds +56: Time to load utils op: 0.0008077621459960938 secondsTime to load utils op: 0.0008375644683837891 seconds +56: +56: Time to load utils op: 0.0011086463928222656 seconds +39: Time to load utils op: 0.0009329319000244141 seconds +39: Time to load utils op: 0.0008797645568847656 seconds +39: Time to load utils op: 0.0009133815765380859 seconds +39: Time to load utils op: 0.000949859619140625 seconds +57: Time to load utils op: 0.0009326934814453125 secondsTime to load utils op: 0.0008919239044189453 seconds +57: +57: Time to load utils op: 0.0009102821350097656 seconds +57: Time to load utils op: 0.0009119510650634766 seconds +18: Time to load utils op: 0.0008826255798339844 seconds +18: Time to load utils op: 0.001009225845336914 seconds +18: Time to load utils op: 0.0009496212005615234 seconds +18: Time to load utils op: 0.001041412353515625 seconds +16: Time to load utils op: 0.0009410381317138672 secondsTime to load utils op: 0.0009343624114990234 seconds +16: +16: Time to load utils op: 0.0009026527404785156 seconds +16: Time to load utils op: 0.0009481906890869141 seconds + 4: Time to load utils op: 0.0007541179656982422 seconds +41: Time to load utils op: 0.000850677490234375 seconds + 4: Time to load utils op: 0.0009889602661132812 seconds +41: Time to load utils op: 0.0009551048278808594 seconds + 4: Time to load utils op: 0.00099945068359375 seconds +41: Time to load utils op: 0.0010342597961425781 seconds + 4: Time to load utils op: 0.0010247230529785156 seconds +41: Time to load utils op: 0.0010631084442138672 seconds + 9: Time to load utils op: 0.00093841552734375 seconds + 9: Time to load utils op: 0.0009608268737792969 seconds + 9: Time to load utils op: 0.0009276866912841797 seconds + 9: Time to load utils op: 0.0009770393371582031 seconds +31: Time to load utils op: 0.0010128021240234375 seconds +31: Time to load utils op: 0.0009610652923583984 secondsTime to load utils op: 0.0009374618530273438 seconds +31: +31: Time to load utils op: 0.0009827613830566406 seconds + 1: Time to load utils op: 0.0010519027709960938 seconds + 1: Time to load utils op: 0.0010387897491455078 seconds + 1: Time to load utils op: 0.0010552406311035156 seconds + 1: Time to load utils op: 0.0010683536529541016 seconds +42: Time to load utils op: 0.0008518695831298828 secondsTime to load utils op: 0.0008590221405029297 seconds +42: +42: Time to load utils op: 0.0007684230804443359 seconds +42: Time to load utils op: 0.0008559226989746094 seconds +34: Time to load utils op: 0.0007605552673339844 seconds +34: Time to load utils op: 0.0009012222290039062 seconds +34: Time to load utils op: 0.0008594989776611328 seconds +34: Time to load utils op: 0.0009071826934814453 seconds +13: Time to load utils op: 0.0006871223449707031 seconds +13: Time to load utils op: 0.0008418560028076172 seconds +13: Time to load utils op: 0.0009348392486572266 seconds + 2: Time to load utils op: 0.0010259151458740234 seconds +13: Time to load utils op: 0.0009613037109375 seconds +58: Time to load utils op: 0.0009293556213378906 seconds +58: Time to load utils op: 0.0009322166442871094 seconds + 2: Time to load utils op: 0.0011417865753173828 seconds +58: Time to load utils op: 0.0009162425994873047 seconds + 2: Time to load utils op: 0.0010955333709716797 seconds +44: Time to load utils op: 0.0009732246398925781 secondsTime to load utils op: 0.0009591579437255859 seconds +44: +44: Time to load utils op: 0.0009696483612060547 seconds +58: Time to load utils op: 0.0009675025939941406 seconds + 2: Time to load utils op: 0.0011684894561767578 seconds +44: Time to load utils op: 0.0010552406311035156 seconds +53: Time to load utils op: 0.000965118408203125 seconds +53: Time to load utils op: 0.0009922981262207031 seconds +53: Time to load utils op: 0.0009567737579345703 seconds +53: Time to load utils op: 0.0010302066802978516 seconds +45: Time to load utils op: 0.0009162425994873047 secondsTime to load utils op: 0.0008649826049804688 seconds +45: +45: Time to load utils op: 0.0008976459503173828 seconds +45: Time to load utils op: 0.0009531974792480469 seconds +21: Time to load utils op: 0.0005066394805908203 seconds +21: Time to load utils op: 0.0005085468292236328 secondsTime to load utils op: 0.0005080699920654297 secondsTime to load utils op: 0.0005209445953369141 seconds +21: +21: +25: Time to load utils op: 0.0008234977722167969 seconds +25: Time to load utils op: 0.0009353160858154297 seconds +25: Time to load utils op: 0.0009133815765380859 seconds +25: Time to load utils op: 0.0009937286376953125 seconds +46: Time to load utils op: 0.0008568763732910156 seconds +38: Time to load utils op: 0.0008862018585205078 seconds +46: Time to load utils op: 0.000978708267211914 seconds +46: Time to load utils op: 0.0009331703186035156 seconds +29: Time to load utils op: 0.0007109642028808594 seconds +38: Time to load utils op: 0.0010223388671875 seconds +46: Time to load utils op: 0.0009365081787109375 seconds +48: Time to load utils op: 0.0009946823120117188 seconds +48: Time to load utils op: 0.0010106563568115234 seconds +38: Time to load utils op: 0.0010139942169189453 seconds +48: Time to load utils op: 0.00096893310546875 seconds +38: Time to load utils op: 0.0010564327239990234 seconds +48: Time to load utils op: 0.000988006591796875 seconds +29: Time to load utils op: 0.0009484291076660156 secondsTime to load utils op: 0.0009243488311767578 seconds +29: +29: Time to load utils op: 0.0009696483612060547 seconds +59: Time to load utils op: 0.0009458065032958984 seconds +59: Time to load utils op: 0.0009367465972900391 secondsTime to load utils op: 0.0009386539459228516 seconds +59: +59: Time to load utils op: 0.0009982585906982422 seconds +49: Time to load utils op: 0.0007832050323486328 seconds +49: Time to load utils op: 0.0008554458618164062 seconds +49: Time to load utils op: 0.0008618831634521484 seconds +49: Time to load utils op: 0.0008990764617919922 seconds +60: Time to load utils op: 0.0009069442749023438 seconds +60: Time to load utils op: 0.0009067058563232422 seconds +60: Time to load utils op: 0.0009291172027587891 seconds +60: Time to load utils op: 0.0009291172027587891 seconds + 7: Time to load utils op: 0.0007092952728271484 seconds +62: Time to load utils op: 0.0008919239044189453 seconds +62: Time to load utils op: 0.0009238719940185547 seconds +62: Time to load utils op: 0.0009219646453857422 seconds +54: Time to load utils op: 0.0006597042083740234 seconds +62: Time to load utils op: 0.0009493827819824219 seconds + 7: Time to load utils op: 0.0008990764617919922 seconds +54: Time to load utils op: 0.0006690025329589844 seconds + 7: Time to load utils op: 0.0008509159088134766 seconds + 7: Time to load utils op: 0.000896453857421875 seconds +54: Time to load utils op: 0.0008444786071777344 seconds +15: Time to load utils op: 0.0009043216705322266 seconds +54: Time to load utils op: 0.0009818077087402344 seconds +15: Time to load utils op: 0.0009789466857910156 secondsTime to load utils op: 0.0009336471557617188 seconds +15: +15: Time to load utils op: 0.0010159015655517578 seconds +22: Time to load utils op: 0.0009353160858154297 secondsTime to load utils op: 0.0009140968322753906 secondsTime to load utils op: 0.0009415149688720703 seconds +22: +22: +22: Time to load utils op: 0.0009527206420898438 seconds +52: Time to load utils op: 0.0009207725524902344 secondsTime to load utils op: 0.0009491443634033203 secondsTime to load utils op: 0.0009431838989257812 seconds +52: +52: +52: Time to load utils op: 0.0009188652038574219 seconds +50: Time to load utils op: 0.0009124279022216797 seconds +50: Time to load utils op: 0.00092315673828125 seconds +50: Time to load utils op: 0.0009138584136962891 seconds +50: Time to load utils op: 0.0009715557098388672 seconds +12: Time to load utils op: 0.0009706020355224609 seconds +12: Time to load utils op: 0.0009903907775878906 seconds +12: Time to load utils op: 0.001003265380859375 seconds +12: Time to load utils op: 0.0010340213775634766 seconds +17: Time to load utils op: 0.0008616447448730469 secondsTime to load utils op: 0.0007505416870117188 seconds +17: +17: Time to load utils op: 0.00069427490234375 seconds +35: Time to load utils op: 0.0007727146148681641 seconds +17: Time to load utils op: 0.0009076595306396484 seconds +35: Time to load utils op: 0.0009007453918457031 seconds +35: Time to load utils op: 0.000911712646484375 seconds +35: Time to load utils op: 0.0009315013885498047 seconds +51: Time to load utils op: 0.0007343292236328125 seconds +51: Time to load utils op: 0.0009832382202148438 secondsTime to load utils op: 0.001005411148071289 seconds +51: +51: Time to load utils op: 0.0010581016540527344 seconds +47: Time to load utils op: 0.0009486675262451172 secondsTime to load utils op: 0.0009322166442871094 secondsTime to load utils op: 0.0009377002716064453 seconds +47: +47: +23: Time to load utils op: 0.0010213851928710938 seconds +47: Time to load utils op: 0.0009768009185791016 seconds +23: Time to load utils op: 0.0011649131774902344 secondsTime to load utils op: 0.0011494159698486328 seconds +23: +37: Time to load utils op: 0.0007028579711914062 seconds +23: Time to load utils op: 0.0012116432189941406 seconds +37: Time to load utils op: 0.0008308887481689453 seconds +37: Time to load utils op: 0.0008456707000732422 seconds +37: Time to load utils op: 0.0008966922760009766 seconds +63: Time to load utils op: 0.001026153564453125 seconds +63: Time to load utils op: 0.0010433197021484375 seconds +63: Time to load utils op: 0.0010116100311279297 seconds +63: Time to load utils op: 0.0011053085327148438 seconds +14: Time to load utils op: 0.0009887218475341797 seconds +14: Time to load utils op: 0.000978708267211914 seconds +14: Time to load utils op: 0.0009856224060058594 seconds +14: Time to load utils op: 0.0010449886322021484 seconds + 3: Time to load utils op: 0.0005104541778564453 seconds + 3: Time to load utils op: 0.00042629241943359375 seconds + 3: Time to load utils op: 0.0004456043243408203 seconds + 3: Time to load utils op: 0.0005023479461669922 seconds +40: Time to load utils op: 0.0008637905120849609 secondsTime to load utils op: 0.0008509159088134766 secondsTime to load utils op: 0.0008542537689208984 seconds +40: +40: +40: Time to load utils op: 0.0008702278137207031 seconds +10: Time to load utils op: 0.0008053779602050781 seconds +10: Time to load utils op: 0.0008146762847900391 secondsTime to load utils op: 0.0008041858673095703 seconds +10: +10: Time to load utils op: 0.0008943080902099609 seconds + 0: [2023-04-29 11:26:34,866] [INFO] [utils.py:827:see_memory_usage] before initializing group 0 + 0: [2023-04-29 11:26:34,867] [INFO] [utils.py:828:see_memory_usage] MA 4.15 GB Max_MA 4.15 GB CA 4.18 GB Max_CA 4 GB + 0: [2023-04-29 11:26:34,867] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 39.84 GB, percent = 7.9% +11: Time to load utils op: 0.0008406639099121094 seconds +11: Time to load utils op: 0.0009503364562988281 secondsTime to load utils op: 0.0009469985961914062 seconds +11: +11: Time to load utils op: 0.0010077953338623047 seconds +26: Time to load utils op: 0.0008237361907958984 seconds +26: Time to load utils op: 0.0008432865142822266 secondsTime to load utils op: 0.0008244514465332031 seconds +26: +26: Time to load utils op: 0.0009024143218994141 seconds +24: Time to load utils op: 0.0008382797241210938 seconds +24: Time to load utils op: 0.0009167194366455078 seconds +24: Time to load utils op: 0.0008597373962402344 seconds +24: Time to load utils op: 0.000978708267211914 seconds +27: Time to load utils op: 0.0007889270782470703 seconds +20: Time to load utils op: 0.0007510185241699219 seconds +27: Time to load utils op: 0.0009086132049560547 secondsTime to load utils op: 0.0008933544158935547 seconds +27: +27: Time to load utils op: 0.0009074211120605469 seconds +20: Time to load utils op: 0.0009524822235107422 seconds +20: Time to load utils op: 0.0009393692016601562 seconds +20: Time to load utils op: 0.0009129047393798828 seconds +28: Time to load utils op: 0.0005967617034912109 seconds +28: Time to load utils op: 0.0006573200225830078 seconds +28: Time to load utils op: 0.0007028579711914062 seconds +36: Time to load utils op: 0.0009095668792724609 seconds +28: Time to load utils op: 0.00086212158203125 seconds +55: Time to load utils op: 0.000705718994140625 seconds +36: Time to load utils op: 0.0010824203491210938 secondsTime to load utils op: 0.0010561943054199219 seconds +36: +36: Time to load utils op: 0.0010764598846435547 seconds +61: Time to load utils op: 0.0010526180267333984 seconds +61: Time to load utils op: 0.001046895980834961 seconds +55: Time to load utils op: 0.0009930133819580078 secondsTime to load utils op: 0.000997304916381836 seconds +55: +61: Time to load utils op: 0.0010323524475097656 seconds +55: Time to load utils op: 0.0010347366333007812 seconds +61: Time to load utils op: 0.0010633468627929688 seconds +30: Time to load utils op: 0.0009884834289550781 secondsTime to load utils op: 0.0009503364562988281 secondsTime to load utils op: 0.0009350776672363281 seconds +30: +30: +30: Time to load utils op: 0.000985860824584961 seconds +19: Time to load utils op: 0.0008406639099121094 seconds +19: Time to load utils op: 0.0009214878082275391 seconds +19: Time to load utils op: 0.0008692741394042969 seconds +19: Time to load utils op: 0.00093841552734375 seconds + 0: [2023-04-29 11:26:34,993] [INFO] [utils.py:827:see_memory_usage] after initializing group 0 + 0: [2023-04-29 11:26:34,993] [INFO] [utils.py:828:see_memory_usage] MA 8.44 GB Max_MA 8.44 GB CA 10.57 GB Max_CA 11 GB + 0: [2023-04-29 11:26:34,994] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 39.91 GB, percent = 7.9% + 0: [2023-04-29 11:26:35,108] [INFO] [utils.py:827:see_memory_usage] before initializing group 1 + 0: [2023-04-29 11:26:35,109] [INFO] [utils.py:828:see_memory_usage] MA 8.44 GB Max_MA 8.44 GB CA 10.57 GB Max_CA 11 GB + 0: [2023-04-29 11:26:35,109] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 39.95 GB, percent = 7.9% + 0: [2023-04-29 11:26:35,228] [INFO] [utils.py:827:see_memory_usage] after initializing group 1 + 0: [2023-04-29 11:26:35,229] [INFO] [utils.py:828:see_memory_usage] MA 12.5 GB Max_MA 12.5 GB CA 16.62 GB Max_CA 17 GB + 0: [2023-04-29 11:26:35,229] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 39.94 GB, percent = 7.9% + 0: [2023-04-29 11:26:35,346] [INFO] [utils.py:827:see_memory_usage] before initializing group 2 + 0: [2023-04-29 11:26:35,346] [INFO] [utils.py:828:see_memory_usage] MA 12.5 GB Max_MA 12.5 GB CA 16.62 GB Max_CA 17 GB + 0: [2023-04-29 11:26:35,347] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 39.99 GB, percent = 7.9% + 0: [2023-04-29 11:26:35,466] [INFO] [utils.py:827:see_memory_usage] after initializing group 2 + 0: [2023-04-29 11:26:35,467] [INFO] [utils.py:828:see_memory_usage] MA 12.51 GB Max_MA 12.51 GB CA 16.62 GB Max_CA 17 GB + 0: [2023-04-29 11:26:35,467] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 40.04 GB, percent = 8.0% +32: ninja: no work to do. +32: Time to load utils op: 0.4123702049255371 seconds +48: Time to load utils op: 0.38137125968933105 seconds +48: Time to load utils op: 0.38496923446655273 seconds +48: Time to load utils op: 0.38884639739990234 seconds +48: Time to load utils op: 0.392056941986084 seconds + 0: [2023-04-29 11:26:35,585] [INFO] [utils.py:827:see_memory_usage] before initialize_optimizer + 0: [2023-04-29 11:26:35,585] [INFO] [utils.py:828:see_memory_usage] MA 12.51 GB Max_MA 12.51 GB CA 16.62 GB Max_CA 17 GB + 0: [2023-04-29 11:26:35,585] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 40.07 GB, percent = 8.0% +32: Time to load utils op: 0.41562795639038086 seconds +42: Time to load utils op: 0.4034445285797119 seconds +42: Time to load utils op: 0.40430688858032227 seconds +42: Time to load utils op: 0.4043235778808594 seconds +42: Time to load utils op: 0.4036295413970947 seconds +32: Time to load utils op: 0.4202749729156494 seconds +36: Time to load utils op: 0.42135143280029297 seconds +32: Time to load utils op: 0.42623424530029297 seconds +36: Time to load utils op: 0.42705750465393066 seconds +52: Time to load utils op: 0.41311001777648926 seconds +41: Time to load utils op: 0.4065234661102295 seconds +41: Time to load utils op: 0.4070451259613037 seconds +41: Time to load utils op: 0.4069392681121826 seconds +36: Time to load utils op: 0.4318816661834717 seconds +41: Time to load utils op: 0.41005611419677734 seconds +52: Time to load utils op: 0.4192533493041992 seconds +34: Time to load utils op: 0.40942931175231934 seconds +36: Time to load utils op: 0.4362602233886719 seconds +57: Time to load utils op: 0.4256103038787842 seconds +33: Time to load utils op: 0.4357597827911377 seconds +52: Time to load utils op: 0.4250786304473877 seconds +63: Time to load utils op: 0.4126262664794922 seconds +51: Time to load utils op: 0.40676355361938477 seconds +34: Time to load utils op: 0.41354894638061523 secondsTime to load utils op: 0.4135313034057617 seconds +34: +34: Time to load utils op: 0.41377830505371094 seconds +63: Time to load utils op: 0.4086489677429199 secondsTime to load utils op: 0.41259193420410156 seconds +63: +63: Time to load utils op: 0.4090547561645508 seconds +57: Time to load utils op: 0.4301872253417969 seconds +37: Time to load utils op: 0.3976767063140869 seconds +53: Time to load utils op: 0.43210816383361816 seconds +33: Time to load utils op: 0.4405782222747803 seconds +60: Time to load utils op: 0.3962874412536621 seconds +40: Time to load utils op: 0.4185009002685547 seconds +54: Time to load utils op: 0.42044568061828613 seconds +46: Time to load utils op: 0.37775397300720215 seconds +46: Time to load utils op: 0.3922257423400879 seconds +46: Time to load utils op: 0.37824225425720215 seconds +57: Time to load utils op: 0.43416786193847656 seconds +46: Time to load utils op: 0.37832140922546387 seconds +52: Time to load utils op: 0.43184757232666016 seconds +56: Time to load utils op: 0.4332282543182373 seconds +45: Time to load utils op: 0.3889937400817871 seconds +44: Time to load utils op: 0.41966843605041504 seconds +60: Time to load utils op: 0.3993973731994629 seconds +55: Time to load utils op: 0.3801121711730957 seconds +37: Time to load utils op: 0.41786670684814453 seconds +51: Time to load utils op: 0.43163156509399414 seconds +49: Time to load utils op: 0.39755916595458984 seconds +33: Time to load utils op: 0.4471902847290039 seconds +53: Time to load utils op: 0.43677639961242676 seconds +51: Time to load utils op: 0.415846586227417 seconds +57: Time to load utils op: 0.438762903213501 seconds +40: Time to load utils op: 0.42453694343566895 seconds +45: Time to load utils op: 0.38271403312683105 seconds +54: Time to load utils op: 0.4260690212249756 seconds +62: Time to load utils op: 0.39653944969177246 seconds +50: Time to load utils op: 0.3801002502441406 seconds +60: Time to load utils op: 0.4020881652832031 seconds +61: Time to load utils op: 0.4012444019317627 seconds +37: Time to load utils op: 0.4069790840148926 seconds +56: Time to load utils op: 0.43912601470947266 seconds +33: Time to load utils op: 0.45186805725097656 seconds +44: Time to load utils op: 0.4258708953857422 seconds +44: Time to load utils op: 0.4263925552368164 secondsTime to load utils op: 0.42639875411987305 seconds +44: +50: Time to load utils op: 0.3822624683380127 seconds +61: Time to load utils op: 0.38561558723449707 seconds +45: Time to load utils op: 0.3860461711883545 seconds +50: Time to load utils op: 0.382354736328125 secondsTime to load utils op: 0.3823821544647217 seconds +50: +38: Time to load utils op: 0.3984055519104004 seconds +37: Time to load utils op: 0.4105203151702881 seconds +45: Time to load utils op: 0.38667798042297363 seconds +49: Time to load utils op: 0.40279603004455566 seconds +55: Time to load utils op: 0.38634324073791504 seconds +35: Time to load utils op: 0.386096715927124 seconds +53: Time to load utils op: 0.4421355724334717 seconds +51: Time to load utils op: 0.4257316589355469 seconds +40: Time to load utils op: 0.430614709854126 seconds +60: Time to load utils op: 0.4093625545501709 seconds +38: Time to load utils op: 0.38314247131347656 seconds +38: Time to load utils op: 0.3835902214050293 secondsTime to load utils op: 0.38359761238098145 seconds +38: +62: Time to load utils op: 0.4029195308685303 seconds +40: Time to load utils op: 0.4321708679199219 seconds +35: Time to load utils op: 0.3888587951660156 seconds +54: Time to load utils op: 0.4338569641113281 seconds +61: Time to load utils op: 0.39043736457824707 seconds +56: Time to load utils op: 0.4454352855682373 seconds +53: Time to load utils op: 0.4444398880004883 seconds +39: Time to load utils op: 0.4560565948486328 seconds +39: Time to load utils op: 0.4560990333557129 seconds +58: Time to load utils op: 0.3836972713470459 seconds +39: Time to load utils op: 0.456693172454834 secondsTime to load utils op: 0.4565591812133789 seconds +39: +59: Time to load utils op: 0.36692285537719727 seconds +54: Time to load utils op: 0.43558287620544434 seconds +55: Time to load utils op: 0.39177918434143066 seconds +49: Time to load utils op: 0.40845274925231934 seconds +63: Time to load utils op: 0.0035893917083740234 seconds +43: Time to load utils op: 0.37378907203674316 seconds +49: Time to load utils op: 0.41087889671325684 seconds +61: Time to load utils op: 0.39547061920166016 seconds +62: Time to load utils op: 0.42266201972961426 seconds +35: Time to load utils op: 0.394930362701416 seconds +56: Time to load utils op: 0.451082706451416 seconds +58: Time to load utils op: 0.38981199264526367 seconds +59: Time to load utils op: 0.3734147548675537 seconds +47: Time to load utils op: 0.3812999725341797 seconds +55: Time to load utils op: 0.4071342945098877 seconds +43: Time to load utils op: 0.379838228225708 seconds +35: Time to load utils op: 0.4003474712371826 seconds +34: Time to load utils op: 0.0014843940734863281 secondsTime to load utils op: 0.0015425682067871094 seconds +34: Time to load utils op: 0.0012443065643310547 seconds +34: +34: Time to load utils op: 0.002111673355102539 seconds +62: Time to load utils op: 0.416579008102417 seconds +58: Time to load utils op: 0.41138291358947754 seconds +47: Time to load utils op: 0.38717103004455566 seconds +59: Time to load utils op: 0.37927699089050293 seconds +47: Time to load utils op: 0.389070987701416 seconds +43: Time to load utils op: 0.38570618629455566 seconds +58: Time to load utils op: 0.399005651473999 seconds +47: Time to load utils op: 0.3920295238494873 seconds +59: Time to load utils op: 0.40099191665649414 seconds +43: Time to load utils op: 0.39188170433044434 seconds +44: Time to load utils op: 0.003526449203491211 seconds +41: Time to load utils op: 0.0023932456970214844 seconds +41: Time to load utils op: 0.002180337905883789 seconds +41: Time to load utils op: 0.0018711090087890625 seconds +41: Time to load utils op: 0.0022826194763183594 seconds +39: Time to load utils op: 0.010691642761230469 seconds +39: Time to load utils op: 0.010733604431152344 seconds +44: Time to load utils op: 0.0061779022216796875 secondsTime to load utils op: 0.006392240524291992 seconds +44: +44: Time to load utils op: 0.0065157413482666016 seconds +51: Time to load utils op: 0.005183696746826172 seconds +51: Time to load utils op: 0.005352020263671875 seconds +51: Time to load utils op: 0.00518035888671875 seconds +51: Time to load utils op: 0.0055005550384521484 seconds +60: Time to load utils op: 0.0034172534942626953 seconds +60: Time to load utils op: 0.0034818649291992188 seconds +60: Time to load utils op: 0.003360271453857422 seconds +60: Time to load utils op: 0.003385782241821289 seconds +32: Time to load utils op: 0.0052416324615478516 seconds +37: Time to load utils op: 0.0005307197570800781 seconds +37: Time to load utils op: 0.00035881996154785156 seconds +37: Time to load utils op: 0.00048470497131347656 seconds +37: Time to load utils op: 0.00037980079650878906 seconds +32: Time to load utils op: 0.0004112720489501953 seconds +32: Time to load utils op: 0.0003764629364013672 seconds +32: Time to load utils op: 0.0003132820129394531 seconds +50: Time to load utils op: 0.0048160552978515625 seconds +50: Time to load utils op: 0.0048065185546875 seconds +50: Time to load utils op: 0.005898475646972656 seconds +50: Time to load utils op: 0.00458979606628418 seconds +36: Time to load utils op: 0.004426717758178711 seconds +36: Time to load utils op: 0.0045795440673828125 seconds +36: Time to load utils op: 0.004610776901245117 seconds +36: Time to load utils op: 0.0037157535552978516 seconds +39: Time to load utils op: 0.0004820823669433594 seconds +38: Time to load utils op: 0.004026651382446289 seconds +38: Time to load utils op: 0.0003707408905029297 seconds +38: Time to load utils op: 0.00034499168395996094 seconds +63: Time to load utils op: 0.0003426074981689453 seconds +54: Time to load utils op: 0.007875442504882812 seconds +63: Time to load utils op: 0.00045609474182128906 seconds +63: Time to load utils op: 0.0004076957702636719 seconds +53: Time to load utils op: 0.004265785217285156 secondsTime to load utils op: 0.004118680953979492 seconds +53: +38: Time to load utils op: 0.0003631114959716797 seconds +54: Time to load utils op: 0.00036907196044921875 secondsTime to load utils op: 0.00038051605224609375 seconds +54: +54: Time to load utils op: 0.00035452842712402344 seconds +39: Time to load utils op: 0.00044655799865722656 seconds +46: Time to load utils op: 0.0006296634674072266 seconds +46: Time to load utils op: 0.0004909038543701172 seconds +46: Time to load utils op: 0.00036334991455078125 secondsTime to load utils op: 0.0003628730773925781 seconds +46: +47: Time to load utils op: 0.005010128021240234 seconds +55: Time to load utils op: 0.0036323070526123047 secondsTime to load utils op: 0.0036134719848632812 seconds +55: +55: Time to load utils op: 0.0035958290100097656 seconds +55: Time to load utils op: 0.00359344482421875 seconds +47: Time to load utils op: 0.0004551410675048828 seconds +47: Time to load utils op: 0.0004265308380126953 seconds +40: Time to load utils op: 0.0004811286926269531 seconds +40: Time to load utils op: 0.00039196014404296875 seconds +40: Time to load utils op: 0.00035643577575683594 secondsTime to load utils op: 0.00037097930908203125 seconds +40: +53: Time to load utils op: 0.0004658699035644531 secondsTime to load utils op: 0.0004303455352783203 seconds +53: +48: Time to load utils op: 0.00475621223449707 seconds +48: Time to load utils op: 0.004374027252197266 seconds +48: Time to load utils op: 0.002386808395385742 seconds +48: Time to load utils op: 0.0003466606140136719 seconds +47: Time to load utils op: 0.00043463706970214844 seconds +45: Time to load utils op: 0.00518345832824707 seconds +45: Time to load utils op: 0.005346536636352539 seconds +45: Time to load utils op: 0.0048792362213134766 seconds +45: Time to load utils op: 0.0004665851593017578 seconds +35: Time to load utils op: 0.0022995471954345703 seconds +35: Time to load utils op: 0.002477407455444336 seconds +35: Time to load utils op: 0.0022792816162109375 seconds +42: Time to load utils op: 0.0041882991790771484 seconds +42: Time to load utils op: 0.006356716156005859 secondsTime to load utils op: 0.004556417465209961 secondsTime to load utils op: 0.0062749385833740234 seconds +42: +42: +35: Time to load utils op: 0.000431060791015625 seconds +33: Time to load utils op: 0.0012607574462890625 seconds +33: Time to load utils op: 0.00037217140197753906 seconds +33: Time to load utils op: 0.00036334991455078125 seconds +33: Time to load utils op: 0.0003533363342285156 seconds +49: Time to load utils op: 0.004974365234375 seconds +49: Time to load utils op: 0.004663944244384766 seconds +49: Time to load utils op: 0.004605531692504883 seconds +49: Time to load utils op: 0.0060062408447265625 seconds +57: Time to load utils op: 0.013193845748901367 seconds +57: Time to load utils op: 0.013174772262573242 secondsTime to load utils op: 0.013231039047241211 seconds +57: +57: Time to load utils op: 0.01301717758178711 seconds +62: Time to load utils op: 0.005958080291748047 seconds +62: Time to load utils op: 0.005541801452636719 seconds +62: Time to load utils op: 0.005437135696411133 secondsTime to load utils op: 0.005484104156494141 seconds +62: + 0: [2023-04-29 11:26:35,910] [INFO] [utils.py:827:see_memory_usage] end initialize_optimizer + 0: [2023-04-29 11:26:35,910] [INFO] [utils.py:828:see_memory_usage] MA 12.64 GB Max_MA 12.64 GB CA 16.62 GB Max_CA 17 GB + 0: [2023-04-29 11:26:35,911] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 40.19 GB, percent = 8.0% +59: Time to load utils op: 0.0038971900939941406 seconds +59: Time to load utils op: 0.009067773818969727 seconds +59: Time to load utils op: 0.009087324142456055 seconds +59: Time to load utils op: 0.00952291488647461 seconds +61: Time to load utils op: 0.006440877914428711 secondsTime to load utils op: 0.0063953399658203125 seconds +61: +61: Time to load utils op: 0.008565187454223633 seconds +61: Time to load utils op: 0.013497352600097656 seconds +52: Time to load utils op: 0.009844779968261719 seconds +58: Time to load utils op: 0.013693571090698242 seconds +58: Time to load utils op: 0.016798734664916992 seconds + 0: [2023-04-29 11:26:36,035] [INFO] [utils.py:827:see_memory_usage] end bf16_optimizer + 0: [2023-04-29 11:26:36,036] [INFO] [utils.py:828:see_memory_usage] MA 12.64 GB Max_MA 12.64 GB CA 16.62 GB Max_CA 17 GB + 0: [2023-04-29 11:26:36,036] [INFO] [utils.py:836:see_memory_usage] CPU Virtual Memory: used = 40.22 GB, percent = 8.0% + 0: [2023-04-29 11:26:36,036] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed Final Optimizer = FusedAdam + 0: [2023-04-29 11:26:36,036] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed using client LR scheduler + 0: [2023-04-29 11:26:36,036] [INFO] [logging.py:68:log_dist] [Rank 0] DeepSpeed LR Scheduler = + 0: [2023-04-29 11:26:36,036] [INFO] [logging.py:68:log_dist] [Rank 0] step=0, skipped=0, lr=[0.0002, 0.0002, 0.0002], mom=[(0.9, 0.999), (0.9, 0.999), (0.9, 0.999)] + 0: [2023-04-29 11:26:36,037] [INFO] [config.py:1007:print] DeepSpeedEngine configuration: + 0: [2023-04-29 11:26:36,037] [INFO] [config.py:1011:print] activation_checkpointing_config { + 0: "partition_activations": false, + 0: "contiguous_memory_optimization": false, + 0: "cpu_checkpointing": false, + 0: "number_checkpoints": null, + 0: "synchronize_checkpoint_boundary": false, + 0: "profile": false + 0: } + 0: [2023-04-29 11:26:36,037] [INFO] [config.py:1011:print] aio_config ................... {'block_size': 1048576, 'queue_depth': 8, 'thread_count': 1, 'single_submit': False, 'overlap_events': True} + 0: [2023-04-29 11:26:36,037] [INFO] [config.py:1011:print] amp_enabled .................. False + 0: [2023-04-29 11:26:36,037] [INFO] [config.py:1011:print] amp_params ................... False + 0: [2023-04-29 11:26:36,037] [INFO] [config.py:1011:print] autotuning_config ............ { + 0: "enabled": false, + 0: "start_step": null, + 0: "end_step": null, + 0: "metric_path": null, + 0: "arg_mappings": null, + 0: "metric": "throughput", + 0: "model_info": null, + 0: "results_dir": "/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/autotuning_results", + 0: "exps_dir": "/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/autotuning_exps", + 0: "overwrite": true, + 0: "fast": true, + 0: "start_profile_step": 3, + 0: "end_profile_step": 5, + 0: "tuner_type": "gridsearch", + 0: "tuner_early_stopping": 5, + 0: "tuner_num_trials": 50, + 0: "model_info_path": null, + 0: "mp_size": 1, + 0: "max_train_batch_size": null, + 0: "min_train_batch_size": 1, + 0: "max_train_micro_batch_size_per_gpu": 1.024000e+03, + 0: "min_train_micro_batch_size_per_gpu": 1, + 0: "num_tuning_micro_batch_sizes": 3 + 0: } + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] bfloat16_enabled ............. True + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] checkpoint_parallel_write_pipeline False + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] checkpoint_tag_validation_enabled True + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] checkpoint_tag_validation_fail False +58: Time to load utils op: 0.016407251358032227 secondsTime to load utils op: 0.016391754150390625 seconds +58: + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] comms_config ................. + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] communication_data_type ...... None + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] compression_config ........... {'weight_quantization': {'shared_parameters': {'enabled': False, 'quantizer_kernel': False, 'schedule_offset': 0, 'quantize_groups': 1, 'quantize_verbose': False, 'quantization_type': 'symmetric', 'quantize_weight_in_forward': False, 'rounding': 'nearest', 'fp16_mixed_quantize': False, 'quantize_change_ratio': 0.001}, 'different_groups': {}}, 'activation_quantization': {'shared_parameters': {'enabled': False, 'quantization_type': 'symmetric', 'range_calibration': 'dynamic', 'schedule_offset': 1000}, 'different_groups': {}}, 'sparse_pruning': {'shared_parameters': {'enabled': False, 'method': 'l1', 'schedule_offset': 1000}, 'different_groups': {}}, 'row_pruning': {'shared_parameters': {'enabled': False, 'method': 'l1', 'schedule_offset': 1000}, 'different_groups': {}}, 'head_pruning': {'shared_parameters': {'enabled': False, 'method': 'topk', 'schedule_offset': 1000}, 'different_groups': {}}, 'channel_pruning': {'shared_pa + 0: rameters': {'enabled': False, 'method': 'l1', 'schedule_offset': 1000}, 'different_groups': {}}, 'layer_reduction': {'enabled': False}} + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] curriculum_enabled ........... False + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] curriculum_params ............ False + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] dataloader_drop_last ......... False + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] disable_allgather ............ False + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] dump_state ................... False + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] dynamic_loss_scale_args ...... None + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] eigenvalue_enabled ........... False + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] eigenvalue_gas_boundary_resolution 1 + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] eigenvalue_layer_name ........ bert.encoder.layer + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] eigenvalue_layer_num ......... 0 + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] eigenvalue_max_iter .......... 100 + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] eigenvalue_stability ......... 1e-06 + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] eigenvalue_tol ............... 0.01 + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] eigenvalue_verbose ........... False + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] elasticity_enabled ........... False + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] flops_profiler_config ........ { + 0: "enabled": false, + 0: "profile_step": 1, + 0: "module_depth": -1, + 0: "top_modules": 1, + 0: "detailed": true, + 0: "output_file": null + 0: } + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] fp16_auto_cast ............... None + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] fp16_enabled ................. False + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] fp16_master_weights_and_gradients False + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] global_rank .................. 0 + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] gradient_accumulation_steps .. 4 + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] gradient_clipping ............ 1.0 + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] gradient_predivide_factor .... 1.0 + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] initial_dynamic_scale ........ 1 + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] load_universal_checkpoint .... False + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] loss_scale ................... 1.0 + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] memory_breakdown ............. False + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] monitor_config ............... + 0: [2023-04-29 11:26:36,038] [INFO] [config.py:1011:print] nebula_config ................ { + 0: "enabled": false, + 0: "persistent_storage_path": null, + 0: "persistent_time_interval": 100, + 0: "num_of_version_in_retention": 2, + 0: "enable_nebula_load": true, + 0: "load_path": null + 0: } + 0: [2023-04-29 11:26:36,039] [INFO] [config.py:1011:print] optimizer_legacy_fusion ...... False + 0: [2023-04-29 11:26:36,039] [INFO] [config.py:1011:print] optimizer_name ............... None + 0: [2023-04-29 11:26:36,039] [INFO] [config.py:1011:print] optimizer_params ............. None + 0: [2023-04-29 11:26:36,039] [INFO] [config.py:1011:print] pipeline ..................... {'stages': 'auto', 'partition': 'best', 'seed_layers': False, 'activation_checkpoint_interval': 0} + 0: [2023-04-29 11:26:36,039] [INFO] [config.py:1011:print] pld_enabled .................. False + 0: [2023-04-29 11:26:36,039] [INFO] [config.py:1011:print] pld_params ................... False + 0: [2023-04-29 11:26:36,039] [INFO] [config.py:1011:print] prescale_gradients ........... False + 0: [2023-04-29 11:26:36,039] [INFO] [config.py:1011:print] scheduler_name ............... None + 0: [2023-04-29 11:26:36,039] [INFO] [config.py:1011:print] scheduler_params ............. None + 0: [2023-04-29 11:26:36,039] [INFO] [config.py:1011:print] sparse_attention ............. None + 0: [2023-04-29 11:26:36,039] [INFO] [config.py:1011:print] sparse_gradients_enabled ..... False + 0: [2023-04-29 11:26:36,039] [INFO] [config.py:1011:print] steps_per_print .............. 2000 + 0: [2023-04-29 11:26:36,039] [INFO] [config.py:1011:print] train_batch_size ............. 512 + 0: [2023-04-29 11:26:36,039] [INFO] [config.py:1011:print] train_micro_batch_size_per_gpu 1 + 0: [2023-04-29 11:26:36,039] [INFO] [config.py:1011:print] use_node_local_storage ....... False + 0: [2023-04-29 11:26:36,039] [INFO] [config.py:1011:print] wall_clock_breakdown ......... False + 0: [2023-04-29 11:26:36,039] [INFO] [config.py:1011:print] world_size ................... 128 + 0: [2023-04-29 11:26:36,039] [INFO] [config.py:1011:print] zero_allow_untested_optimizer False +52: Time to load utils op: 0.01866626739501953 seconds + 0: [2023-04-29 11:26:36,039] [INFO] [config.py:1011:print] zero_config .................. stage=0 contiguous_gradients=True reduce_scatter=True reduce_bucket_size=500000000 allgather_partitions=True allgather_bucket_size=500000000 overlap_comm=False load_from_fp32_weights=True elastic_checkpoint=False offload_param=None offload_optimizer=None sub_group_size=1000000000 cpu_offload_param=None cpu_offload_use_pin_memory=None cpu_offload=None prefetch_bucket_size=50000000 param_persistence_threshold=100000 model_persistence_threshold=9223372036854775807 max_live_parameters=1000000000 max_reuse_distance=1000000000 gather_16bit_weights_on_model_save=False stage3_gather_fp16_weights_on_model_save=False ignore_unused_parameters=True legacy_stage1=False round_robin_gradients=False + 0: [2023-04-29 11:26:36,039] [INFO] [config.py:1011:print] zero_enabled ................. False + 0: [2023-04-29 11:26:36,039] [INFO] [config.py:1011:print] zero_optimization_stage ...... 0 + 0: [2023-04-29 11:26:36,039] [INFO] [config.py:996:print_user_config] json = { + 0: "train_micro_batch_size_per_gpu": 1, + 0: "train_batch_size": 512, + 0: "gradient_clipping": 1.0, + 0: "zero_optimization": { + 0: "stage": 0 + 0: }, + 0: "bf16": { + 0: "enabled": true + 0: }, + 0: "steps_per_print": 2.000000e+03, + 0: "wall_clock_breakdown": false + 0: } +52: Time to load utils op: 0.013350963592529297 seconds +52: Time to load utils op: 0.008359670639038086 seconds +56: Time to load utils op: 0.0072062015533447266 seconds + 0: Time to load utils op: 0.011713504791259766 seconds + 0: [2023-04-29 11:26:36,051] [INFO] [engine.py:87:__init__] CONFIG: micro_batches=4 micro_batch_size=1 +43: Time to load utils op: 0.007218360900878906 seconds +43: Time to load utils op: 0.00684809684753418 seconds +56: Time to load utils op: 0.009788990020751953 seconds +43: Time to load utils op: 0.020364999771118164 seconds +56: Time to load utils op: 0.019504785537719727 seconds +56: Time to load utils op: 0.02156519889831543 seconds +43: Time to load utils op: 0.025338411331176758 seconds + 0: ninja: no work to do. + 0: Time to load utils op: 0.383289098739624 seconds + 0: Time to load utils op: 0.0042209625244140625 seconds +28: Time to load utils op: 0.9096662998199463 seconds +24: Time to load utils op: 0.905526876449585 seconds +23: Time to load utils op: 0.9529955387115479 seconds +13: Time to load utils op: 0.9632806777954102 seconds +28: Time to load utils op: 0.9306552410125732 seconds +24: Time to load utils op: 0.911431074142456 seconds +12: Time to load utils op: 0.9170932769775391 seconds +23: Time to load utils op: 0.9562265872955322 seconds +24: Time to load utils op: 0.9148273468017578 seconds +23: Time to load utils op: 0.9564869403839111 seconds +20: Time to load utils op: 0.9167516231536865 seconds +30: Time to load utils op: 0.9122886657714844 seconds +13: Time to load utils op: 0.9690158367156982 seconds +28: Time to load utils op: 0.9216804504394531 seconds +21: Time to load utils op: 0.9177565574645996 seconds +24: Time to load utils op: 0.918346643447876 seconds +12: Time to load utils op: 0.9233558177947998 seconds +23: Time to load utils op: 0.9624133110046387 seconds +20: Time to load utils op: 0.9229676723480225 seconds +30: Time to load utils op: 0.9184277057647705 seconds +13: Time to load utils op: 0.9751756191253662 seconds + 0: Time to load utils op: 1.0172946453094482 seconds +28: Time to load utils op: 0.928037166595459 seconds +21: Time to load utils op: 0.9236483573913574 seconds +12: Time to load utils op: 0.9295225143432617 seconds +20: Time to load utils op: 0.9288599491119385 seconds +30: Time to load utils op: 0.9245090484619141 seconds +13: Time to load utils op: 0.9815382957458496 seconds + 0: Time to load utils op: 1.0231800079345703 seconds +21: Time to load utils op: 0.9296867847442627 seconds +12: Time to load utils op: 0.9353220462799072 seconds +20: Time to load utils op: 0.9351978302001953 seconds +30: Time to load utils op: 0.9303295612335205 seconds + 0: Time to load utils op: 1.0296897888183594 seconds +21: Time to load utils op: 0.9356124401092529 seconds + 7: Time to load utils op: 0.9716174602508545 seconds +22: Time to load utils op: 0.9851851463317871 seconds +25: Time to load utils op: 0.9863710403442383 seconds + 7: Time to load utils op: 0.9626872539520264 seconds +27: Time to load utils op: 0.9946832656860352 seconds +25: Time to load utils op: 0.9893317222595215 seconds +22: Time to load utils op: 0.9912288188934326 seconds +10: Time to load utils op: 1.0439703464508057 seconds + 3: Time to load utils op: 1.0506610870361328 seconds + 7: Time to load utils op: 0.968980073928833 seconds +27: Time to load utils op: 1.0008313655853271 seconds +27: Time to load utils op: 0.997816801071167 secondsTime to load utils op: 1.0009229183197021 seconds +27: +26: Time to load utils op: 1.041250228881836 seconds +25: Time to load utils op: 0.9985413551330566 seconds + 8: Time to load utils op: 1.0522825717926025 seconds +22: Time to load utils op: 0.9972352981567383 seconds +10: Time to load utils op: 1.049656867980957 seconds + 6: Time to load utils op: 1.0539724826812744 seconds + 3: Time to load utils op: 1.056335210800171 seconds + 5: Time to load utils op: 1.0559442043304443 seconds + 7: Time to load utils op: 0.9748153686523438 seconds +26: Time to load utils op: 1.0470504760742188 seconds +25: Time to load utils op: 1.004392147064209 seconds + 8: Time to load utils op: 1.057401418685913 seconds +22: Time to load utils op: 1.0007555484771729 seconds +10: Time to load utils op: 1.0562481880187988 seconds + 6: Time to load utils op: 1.060617208480835 seconds + 3: Time to load utils op: 1.0621068477630615 seconds + 5: Time to load utils op: 1.0616121292114258 seconds +29: Time to load utils op: 1.0491914749145508 seconds +26: Time to load utils op: 1.053154468536377 seconds + 8: Time to load utils op: 1.0640208721160889 seconds + 2: Time to load utils op: 1.0481295585632324 seconds +15: Time to load utils op: 0.9839377403259277 seconds +10: Time to load utils op: 1.0622897148132324 seconds + 6: Time to load utils op: 1.0668752193450928 seconds + 3: Time to load utils op: 1.0682151317596436 seconds + 5: Time to load utils op: 1.067765712738037 seconds +29: Time to load utils op: 1.055246353149414 seconds + 1: Time to load utils op: 0.9927449226379395 seconds +14: Time to load utils op: 1.0255472660064697 seconds +26: Time to load utils op: 1.0602281093597412 seconds +31: Time to load utils op: 0.988276481628418 seconds + 2: Time to load utils op: 1.0540766716003418 seconds +15: Time to load utils op: 1.005110740661621 seconds + 8: Time to load utils op: 1.0694074630737305 seconds + 6: Time to load utils op: 1.0726709365844727 seconds + 5: Time to load utils op: 1.074563980102539 seconds +29: Time to load utils op: 1.0615596771240234 seconds + 1: Time to load utils op: 0.9989709854125977 seconds +23: Time to load utils op: 0.002014636993408203 seconds +14: Time to load utils op: 1.0207369327545166 seconds +17: Time to load utils op: 1.028618335723877 seconds +31: Time to load utils op: 0.9940967559814453 seconds +23: Time to load utils op: 0.0003509521484375 seconds + 2: Time to load utils op: 1.0601508617401123 seconds +15: Time to load utils op: 0.9956498146057129 seconds + 1: Time to load utils op: 1.0052659511566162 seconds +29: Time to load utils op: 1.0677969455718994 seconds +14: Time to load utils op: 1.0267486572265625 seconds +17: Time to load utils op: 1.0315735340118408 seconds +18: Time to load utils op: 0.9966104030609131 seconds +31: Time to load utils op: 1.0005035400390625 seconds + 2: Time to load utils op: 1.0662617683410645 seconds +15: Time to load utils op: 1.0016891956329346 seconds +19: Time to load utils op: 0.9993910789489746 seconds +16: Time to load utils op: 0.9959242343902588 seconds + 9: Time to load utils op: 0.9989233016967773 seconds +14: Time to load utils op: 1.0317752361297607 seconds + 4: Time to load utils op: 1.0492351055145264 seconds +11: Time to load utils op: 0.9990394115447998 seconds +23: Time to load utils op: 0.0004429817199707031 seconds + 1: Time to load utils op: 1.0112388134002686 seconds +17: Time to load utils op: 1.04058837890625 seconds +18: Time to load utils op: 1.0026285648345947 seconds +17: Time to load utils op: 1.037574052810669 seconds +31: Time to load utils op: 1.0127770900726318 seconds +11: Time to load utils op: 1.0020592212677002 seconds +19: Time to load utils op: 0.9993484020233154 seconds +16: Time to load utils op: 1.002131462097168 seconds + 9: Time to load utils op: 1.005124807357788 seconds + 4: Time to load utils op: 1.0549969673156738 seconds +18: Time to load utils op: 1.00846529006958 seconds +19: Time to load utils op: 1.0115258693695068 seconds +11: Time to load utils op: 1.0084431171417236 seconds +23: Time to load utils op: 0.000400543212890625 seconds +11: Time to load utils op: 1.008692741394043 seconds + 9: Time to load utils op: 1.0112178325653076 seconds +16: Time to load utils op: 1.0081965923309326 seconds + 4: Time to load utils op: 1.0614182949066162 seconds +18: Time to load utils op: 1.0148353576660156 seconds +19: Time to load utils op: 1.0113162994384766 seconds + 9: Time to load utils op: 1.0171046257019043 seconds +16: Time to load utils op: 1.0140678882598877 seconds + 4: Time to load utils op: 1.0671794414520264 seconds +12: Time to load utils op: 0.0004987716674804688 seconds +12: Time to load utils op: 0.0004298686981201172 seconds +12: Time to load utils op: 0.0004909038543701172 seconds +12: Time to load utils op: 0.0004825592041015625 seconds + 0: [2023-04-29 11:26:37,067] [INFO] [engine.py:145:__init__] RANK=0 STAGE=0 LAYERS=24 [0, 24) STAGE_PARAMS=2226419712 (2226.420M) TOTAL_PARAMS=8905695232 (8905.695M) UNIQUE_PARAMS=8682348544 (8682.349M) + 0: [2023-04-29 11:26:37,067] [INFO] [engine.py:145:__init__] RANK=1 STAGE=0 LAYERS=24 [0, 24) STAGE_PARAMS=2226419712 (2226.420M) TOTAL_PARAMS=8905695232 (8905.695M) UNIQUE_PARAMS=8682348544 (8682.349M) +32: [2023-04-29 11:26:37,069] [INFO] [engine.py:145:__init__] RANK=256 STAGE=1 LAYERS=25 [24, 49) STAGE_PARAMS=2226427904 (2226.428M) TOTAL_PARAMS=8905695232 (8905.695M) UNIQUE_PARAMS=8682348544 (8682.349M) +32: [2023-04-29 11:26:37,069] [INFO] [engine.py:145:__init__] RANK=257 STAGE=1 LAYERS=25 [24, 49) STAGE_PARAMS=2226427904 (2226.428M) TOTAL_PARAMS=8905695232 (8905.695M) UNIQUE_PARAMS=8682348544 (8682.349M) +17: Time to load utils op: 0.003484010696411133 seconds +17: Time to load utils op: 0.006563901901245117 seconds +17: Time to load utils op: 0.006020069122314453 secondsTime to load utils op: 0.0060465335845947266 seconds +17: +22: Time to load utils op: 0.003596067428588867 seconds +22: Time to load utils op: 0.00647425651550293 seconds +22: Time to load utils op: 0.005919694900512695 secondsTime to load utils op: 0.005898475646972656 seconds +22: +13: Time to load utils op: 0.0044403076171875 seconds +13: Time to load utils op: 0.0004630088806152344 seconds +13: Time to load utils op: 0.0003809928894042969 seconds +13: Time to load utils op: 0.0003833770751953125 seconds +27: Time to load utils op: 0.003609180450439453 secondsTime to load utils op: 0.003606081008911133 seconds +27: +27: Time to load utils op: 0.00603175163269043 secondsTime to load utils op: 0.00607752799987793 seconds +27: +26: Time to load utils op: 0.0061528682708740234 seconds +26: Time to load utils op: 0.006081104278564453 secondsTime to load utils op: 0.00605463981628418 seconds +26: +26: Time to load utils op: 0.005950212478637695 seconds + 8: Time to load utils op: 0.003562450408935547 seconds + 8: Time to load utils op: 0.003543853759765625 seconds + 8: Time to load utils op: 0.0035445690155029297 seconds +11: Time to load utils op: 0.0039598941802978516 seconds + 8: Time to load utils op: 0.006503105163574219 seconds +29: Time to load utils op: 0.004538774490356445 seconds +11: Time to load utils op: 0.0004088878631591797 seconds +11: Time to load utils op: 0.00037407875061035156 seconds +11: Time to load utils op: 0.0003914833068847656 seconds +29: Time to load utils op: 0.0004792213439941406 seconds +29: Time to load utils op: 0.0004918575286865234 seconds +29: Time to load utils op: 0.0004734992980957031 seconds +16: Time to load utils op: 0.001409292221069336 secondsTime to load utils op: 0.0015447139739990234 seconds +16: +16: Time to load utils op: 0.00047850608825683594 seconds +16: Time to load utils op: 0.0004024505615234375 seconds + 5: Time to load utils op: 0.005834102630615234 seconds + 5: Time to load utils op: 0.0060024261474609375 seconds + 5: Time to load utils op: 0.005772829055786133 seconds + 5: Time to load utils op: 0.00577998161315918 seconds + 0: Time to load utils op: 0.004048824310302734 seconds + 0: Time to load utils op: 0.004042148590087891 seconds + 0: Time to load utils op: 0.004060029983520508 seconds +28: Time to load utils op: 0.00426936149597168 seconds +24: Time to load utils op: 0.004401206970214844 secondsTime to load utils op: 0.004411220550537109 secondsTime to load utils op: 0.004455089569091797 seconds +24: +24: +28: Time to load utils op: 0.003956794738769531 seconds +30: Time to load utils op: 0.003993511199951172 seconds +28: Time to load utils op: 0.0003905296325683594 seconds +24: Time to load utils op: 0.0004744529724121094 seconds +30: Time to load utils op: 0.00040650367736816406 seconds +30: Time to load utils op: 0.0004994869232177734 seconds +30: Time to load utils op: 0.00048065185546875 seconds +20: Time to load utils op: 0.0044481754302978516 seconds +20: Time to load utils op: 0.004464387893676758 seconds +20: Time to load utils op: 0.0038423538208007812 seconds +28: Time to load utils op: 0.00048422813415527344 seconds +21: Time to load utils op: 0.0039789676666259766 secondsTime to load utils op: 0.003936290740966797 seconds +21: + 9: Time to load utils op: 0.003909111022949219 seconds +21: Time to load utils op: 0.00042438507080078125 seconds + 9: Time to load utils op: 0.00047326087951660156 seconds +14: Time to load utils op: 0.003757953643798828 seconds +21: Time to load utils op: 0.0003407001495361328 seconds + 9: Time to load utils op: 0.003960132598876953 secondsTime to load utils op: 0.0039556026458740234 seconds + 9: +20: Time to load utils op: 0.00047850608825683594 seconds +14: Time to load utils op: 0.003901958465576172 seconds +14: Time to load utils op: 0.00047588348388671875 seconds +14: Time to load utils op: 0.0004336833953857422 seconds +25: Time to load utils op: 0.0040645599365234375 secondsTime to load utils op: 0.0038781166076660156 seconds +25: +25: Time to load utils op: 0.0038597583770751953 seconds + 7: Time to load utils op: 0.004319429397583008 seconds + 7: Time to load utils op: 0.0004763603210449219 seconds +25: Time to load utils op: 0.0004172325134277344 seconds + 7: Time to load utils op: 0.00048661231994628906 seconds + 7: Time to load utils op: 0.00041675567626953125 seconds + 6: Time to load utils op: 0.003872394561767578 seconds +10: Time to load utils op: 0.003966331481933594 seconds +10: Time to load utils op: 0.0039157867431640625 seconds +10: Time to load utils op: 0.001163482666015625 seconds + 6: Time to load utils op: 0.0003924369812011719 seconds + 6: Time to load utils op: 0.0004582405090332031 seconds +31: Time to load utils op: 0.003978729248046875 secondsTime to load utils op: 0.0039522647857666016 seconds +31: + 2: Time to load utils op: 0.004379987716674805 secondsTime to load utils op: 0.00440669059753418 seconds + 2: +31: Time to load utils op: 0.000453948974609375 seconds + 1: Time to load utils op: 0.003954172134399414 secondsTime to load utils op: 0.0039577484130859375 seconds + 1: + 3: Time to load utils op: 0.004003763198852539 seconds + 3: Time to load utils op: 0.0040051937103271484 seconds + 3: Time to load utils op: 0.004072904586791992 seconds +15: Time to load utils op: 0.004215717315673828 seconds +10: Time to load utils op: 0.00047516822814941406 seconds + 1: Time to load utils op: 0.004263877868652344 seconds + 6: Time to load utils op: 0.00039505958557128906 seconds +31: Time to load utils op: 0.0004048347473144531 seconds + 2: Time to load utils op: 0.0003695487976074219 seconds +15: Time to load utils op: 0.0043909549713134766 seconds +15: Time to load utils op: 0.00037860870361328125 seconds + 3: Time to load utils op: 0.0004999637603759766 seconds + 2: Time to load utils op: 0.00036144256591796875 seconds + 1: Time to load utils op: 0.0003790855407714844 seconds +19: Time to load utils op: 0.0041942596435546875 secondsTime to load utils op: 0.0038518905639648438 seconds +19: +15: Time to load utils op: 0.0004012584686279297 seconds +18: Time to load utils op: 0.003887653350830078 secondsTime to load utils op: 0.0038793087005615234 seconds +18: +18: Time to load utils op: 0.0042269229888916016 seconds + 4: Time to load utils op: 0.00395655632019043 seconds +19: Time to load utils op: 0.00047397613525390625 seconds + 4: Time to load utils op: 0.004137277603149414 seconds +19: Time to load utils op: 0.000396728515625 seconds + 4: Time to load utils op: 0.0004591941833496094 secondsTime to load utils op: 0.00045609474182128906 seconds + 4: +18: Time to load utils op: 0.0004820823669433594 seconds +38: [2023-04-29 11:26:39,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +38: [2023-04-29 11:26:39,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +38: [2023-04-29 11:26:39,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +38: [2023-04-29 11:26:39,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +38: [2023-04-29 11:26:39,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +38: [2023-04-29 11:26:39,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +38: [2023-04-29 11:26:39,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +38: [2023-04-29 11:26:39,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +51: [2023-04-29 11:26:39,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +51: [2023-04-29 11:26:39,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +51: [2023-04-29 11:26:39,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +51: [2023-04-29 11:26:39,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +51: [2023-04-29 11:26:39,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +51: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +51: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +53: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +53: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +53: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +53: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +53: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +33: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +33: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +53: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +33: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +33: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +33: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +33: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +53: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +33: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 3: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 3: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 3: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 3: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 3: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 3: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 3: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +54: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +54: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +54: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +54: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +54: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +54: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +54: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +51: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +13: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +33: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +53: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 3: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +54: [2023-04-29 11:26:39,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +13: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +13: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +13: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +13: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +13: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +13: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +39: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +39: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +39: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +39: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +39: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +24: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +24: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +24: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +24: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +24: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +39: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +39: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 4: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 4: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 4: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 4: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 4: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +24: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +24: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 4: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +43: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +43: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +43: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +43: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +43: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +55: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +55: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +55: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +55: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +55: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 4: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +43: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +43: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +13: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +55: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +55: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +24: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +39: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 4: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +43: [2023-04-29 11:26:39,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +23: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +55: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +40: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +36: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +21: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +40: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +36: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +36: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +36: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +36: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +36: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +21: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +21: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +21: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +21: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +21: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +21: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +36: [2023-04-29 11:26:39,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +61: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +34: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +56: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 9: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 7: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +32: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +50: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 7: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +34: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +34: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +34: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +40: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +40: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +34: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +34: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +34: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +40: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 9: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +50: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +50: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +50: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +50: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +56: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +56: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 9: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 7: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 7: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +32: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +32: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +61: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +61: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +61: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +56: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +40: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +40: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +50: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +50: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +32: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +32: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +47: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +47: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +47: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +47: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +56: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +56: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 9: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 9: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 7: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 7: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +32: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +47: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +47: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +47: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +56: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 9: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 9: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +61: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +61: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +61: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +32: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 7: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +47: [2023-04-29 11:26:39,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +36: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +32: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 9: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +23: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +49: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +59: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +23: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +49: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +49: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +49: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +49: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +49: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +23: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +59: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +59: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +49: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +23: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +23: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +59: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +59: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +59: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +59: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +23: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +46: [2023-04-29 11:26:39,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +56: [2023-04-29 11:26:39,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 7: [2023-04-29 11:26:39,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 11:26:39,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +35: [2023-04-29 11:26:39,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +50: [2023-04-29 11:26:39,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 11:26:39,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 11:26:39,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 11:26:39,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 11:26:39,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +45: [2023-04-29 11:26:39,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 11:26:39,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 11:26:39,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +45: [2023-04-29 11:26:39,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +45: [2023-04-29 11:26:39,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +45: [2023-04-29 11:26:39,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +46: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +46: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +46: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +45: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +46: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +46: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +46: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +40: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +35: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +35: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +35: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +35: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +35: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +45: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +45: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +35: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +42: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +42: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +42: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +42: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +62: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +62: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +62: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +62: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +62: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +42: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +42: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +42: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +62: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +62: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +57: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +57: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +57: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +57: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +57: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +57: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +15: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +57: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 5: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +62: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +52: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +52: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +52: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +52: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +52: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +42: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 6: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +48: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 5: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 5: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 5: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 5: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 5: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +52: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +52: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 5: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 5: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +52: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 11:26:39,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +49: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +57: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +15: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +44: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +19: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +19: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +59: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +15: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +15: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +15: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +31: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +15: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +15: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +20: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 6: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +58: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +63: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +58: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +58: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +48: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +48: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +48: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +48: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +48: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 6: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +23: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +58: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +48: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 6: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +45: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +19: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +19: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +15: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +35: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 6: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 6: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +63: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +63: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +63: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +63: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +63: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 6: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +63: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +20: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +20: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +20: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +20: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +20: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 6: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +44: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +44: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +58: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +58: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +58: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +48: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +44: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +44: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +31: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +31: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +31: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +31: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +19: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +19: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +19: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +44: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +31: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +31: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +20: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +58: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +19: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +44: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +31: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +63: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +20: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +44: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +60: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +60: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +60: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +60: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +60: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +60: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +60: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +22: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +22: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +22: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +22: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +22: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +37: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +37: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +37: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +37: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +37: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +22: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +22: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +37: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +37: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +22: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +37: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +60: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +41: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +41: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +41: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +41: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +41: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +41: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +41: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +41: [2023-04-29 11:26:39,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 2: [2023-04-29 11:26:39,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 2: [2023-04-29 11:26:39,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 2: [2023-04-29 11:26:39,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 2: [2023-04-29 11:26:39,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 2: [2023-04-29 11:26:39,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 2: [2023-04-29 11:26:39,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 2: [2023-04-29 11:26:39,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +53: [2023-04-29 11:26:39,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +53: [2023-04-29 11:26:39,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +53: [2023-04-29 11:26:39,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +33: [2023-04-29 11:26:39,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +33: [2023-04-29 11:26:39,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +33: [2023-04-29 11:26:39,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +33: [2023-04-29 11:26:39,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +33: [2023-04-29 11:26:39,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +53: [2023-04-29 11:26:39,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +53: [2023-04-29 11:26:39,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +53: [2023-04-29 11:26:39,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +33: [2023-04-29 11:26:39,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +33: [2023-04-29 11:26:39,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +53: [2023-04-29 11:26:39,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +33: [2023-04-29 11:26:39,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +53: [2023-04-29 11:26:39,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 2: [2023-04-29 11:26:39,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +53: [2023-04-29 11:26:39,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +33: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +33: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +33: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +33: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +38: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +38: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +38: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +38: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +53: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +53: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +53: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +51: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +51: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +33: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +33: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +33: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +43: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +43: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +53: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +53: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +53: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +38: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +38: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +38: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +33: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +53: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +51: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +51: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +51: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +51: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +51: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +43: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +43: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +38: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +43: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +43: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +43: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +43: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +51: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 4: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 4: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 4: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +51: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +51: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... + 4: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +51: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +51: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +51: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +43: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +43: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +38: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +38: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +38: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +51: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +51: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +38: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... + 3: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +51: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +38: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +38: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +43: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +38: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +43: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +43: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +38: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... + 3: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +43: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +43: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +43: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... + 3: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 3: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 3: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 4: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 4: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 3: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 3: [2023-04-29 11:26:39,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 3: [2023-04-29 11:26:39,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 3: [2023-04-29 11:26:39,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 3: [2023-04-29 11:26:39,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 3: [2023-04-29 11:26:39,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 4: [2023-04-29 11:26:39,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 11:26:39,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 11:26:39,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 11:26:39,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 11:26:39,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +54: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +54: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +54: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +54: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +54: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +54: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 6: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +54: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 6: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 6: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +54: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 4: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 4: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 6: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 6: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 6: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 6: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +55: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +55: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +55: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +55: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +55: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +55: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +55: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +39: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +39: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +39: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +39: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +39: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +54: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +54: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +39: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +39: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +54: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +54: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... + 4: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +55: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +54: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +54: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +54: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +54: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +39: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 3: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 3: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 3: [2023-04-29 11:26:39,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +23: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +23: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +39: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +39: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +23: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +55: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +55: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +55: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +55: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +55: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +39: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +39: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +39: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +39: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +55: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +55: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +23: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +55: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +39: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +39: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +23: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 6: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +23: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +23: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +23: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +13: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +13: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +13: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +13: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +13: [2023-04-29 11:26:39,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +13: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +13: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +13: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +23: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +12: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +11: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +11: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +11: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +11: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +11: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +11: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +11: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +11: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +23: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 6: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +12: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 6: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 6: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +23: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +11: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +11: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +11: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +11: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +12: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +12: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +12: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +12: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +13: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 11:26:39,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +13: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +23: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +32: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +32: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +32: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +32: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +32: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +32: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +32: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +32: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +12: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +11: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +13: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +11: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +32: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +32: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... + 7: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +32: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +32: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +32: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +32: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... + 7: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +32: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +13: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 7: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +32: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +12: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 11:26:39,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 7: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 7: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 7: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +36: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +36: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +36: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +36: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +36: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +24: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +36: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +36: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +12: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +36: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +11: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +62: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +62: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +62: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +62: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +62: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +24: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +11: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +62: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +62: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +30: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +11: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +30: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +62: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +12: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +12: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +11: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +12: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +36: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +36: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +36: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +36: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +30: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +30: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +24: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +24: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +36: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +36: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +36: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +36: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +30: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +24: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +24: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +30: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 7: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +62: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +62: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +62: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +62: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +62: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +62: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +62: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +62: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... + 7: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +56: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +56: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +56: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +56: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +56: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +56: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +56: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +56: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 0: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 0: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 0: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 0: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 0: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 0: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 0: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +56: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... + 7: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 0: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +25: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +25: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +24: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 7: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 0: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 5: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +56: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +56: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +56: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... + 7: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +56: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +56: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +56: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +30: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 5: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 5: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 0: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 0: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +10: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +10: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +10: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +10: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +10: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +56: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... + 0: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +10: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +10: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 5: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 5: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 5: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +30: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +24: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +40: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +40: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +25: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +40: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +40: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +40: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +40: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +40: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +18: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +10: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +10: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +10: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +10: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +40: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +30: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 8: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +18: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +24: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 8: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +18: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +40: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +40: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +40: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +26: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +25: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +40: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +40: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +40: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +40: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +40: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +26: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 0: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +50: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +50: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +50: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +50: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +50: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +18: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 5: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 8: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +18: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +18: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 5: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +50: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +10: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +50: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +26: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +26: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 0: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +50: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 0: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 0: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +29: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +29: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +29: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +10: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +15: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +29: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +29: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +29: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +29: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +50: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +50: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +50: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +50: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +25: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +15: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +15: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +50: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +15: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +50: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +50: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +50: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +15: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +10: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +18: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +15: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +15: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 8: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +29: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +29: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +29: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +29: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 8: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +26: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +49: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +49: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +49: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +49: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +49: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +10: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +49: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +49: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 9: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 9: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 9: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 0: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 8: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 9: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 9: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +49: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 9: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +10: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 9: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 9: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 9: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +35: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +35: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +35: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +35: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +35: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 0: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 0: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +35: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +35: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +10: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +26: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 5: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +35: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +10: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +49: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +49: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +49: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +49: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +26: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +49: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +49: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +49: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +49: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... + 9: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 9: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 9: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 9: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +15: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +18: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +35: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +16: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +16: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +16: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +16: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +16: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +29: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +35: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +35: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +16: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +16: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 8: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +35: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +35: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +35: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +35: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +35: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +16: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 8: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +16: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +16: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +15: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +16: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 8: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +17: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +17: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +17: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +17: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +17: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +18: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +29: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +15: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +17: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +63: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +63: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +63: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +63: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +63: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +26: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +29: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +16: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +16: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +16: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +16: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +58: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +58: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +58: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +58: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +58: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +63: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +47: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +47: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +63: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +58: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +58: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +47: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +47: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +47: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +47: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +63: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +47: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +58: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +14: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +14: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +14: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +14: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +14: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 9: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +22: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +26: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +27: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +17: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +17: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +14: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +14: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +47: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +14: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +31: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +17: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +42: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +14: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +27: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 1: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 1: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 1: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 1: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 9: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +15: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +42: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +42: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +42: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +42: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +42: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 9: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +63: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... + 1: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 1: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +22: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +22: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +42: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +29: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +15: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +63: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +22: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +31: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +31: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +31: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +31: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +63: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +58: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +58: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +58: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +58: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +42: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 1: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +45: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +45: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +45: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +45: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +45: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +63: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +47: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +47: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +44: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +44: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +44: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +44: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +44: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +58: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +58: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +58: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +27: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +27: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +27: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +15: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +29: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +14: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 9: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +45: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +45: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +63: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +63: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +63: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +63: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +58: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +27: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +47: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +47: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +44: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +44: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +47: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +14: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +14: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +45: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +59: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +59: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +59: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +59: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +59: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +47: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +14: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +20: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +47: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +52: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +16: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +59: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +59: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +42: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +47: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +29: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 1: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +20: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +52: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +42: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +42: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +52: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +52: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +52: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +57: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +57: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +57: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +57: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +57: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +20: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +17: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +42: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +42: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +29: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 1: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +52: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +52: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +59: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +42: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +41: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +41: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +41: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +41: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +41: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +16: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +57: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +57: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +42: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +37: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +37: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +37: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +42: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +41: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +41: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +44: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +45: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +20: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +37: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +37: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +37: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +37: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +16: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +45: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +45: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +45: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +57: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +48: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +48: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +48: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +48: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +48: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +60: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +60: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +60: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +60: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +60: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +45: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +19: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +19: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +19: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 9: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +52: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +45: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +44: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +44: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +60: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +60: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +17: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +48: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +48: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +37: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 9: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +45: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +45: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +16: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +59: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +41: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +44: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +52: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +52: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +31: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +59: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +22: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +44: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +59: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +44: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +60: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +59: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +20: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +20: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +17: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +52: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +52: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +31: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +44: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +59: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +59: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +59: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +59: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +22: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +20: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +44: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +44: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +52: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +52: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +27: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +41: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +41: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +41: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... + 9: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +52: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +52: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +48: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +48: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +37: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +41: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +22: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +41: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +41: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +41: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +60: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +57: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +57: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +57: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +57: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +41: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +19: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +19: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +19: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +19: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +48: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +37: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +37: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +37: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +37: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +37: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +57: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +57: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +57: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +48: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... + 1: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +60: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +60: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +60: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +31: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +16: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +57: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +37: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +37: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +48: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... + 1: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +60: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +16: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +48: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +48: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +48: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +48: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +60: [2023-04-29 11:26:39,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +31: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +17: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +60: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +60: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +16: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +27: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 1: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +17: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +16: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +17: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +31: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +19: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +31: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +31: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +14: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +22: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +22: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +27: [2023-04-29 11:26:39,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +27: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +19: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +27: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +22: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +22: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +27: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +14: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 1: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +14: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +14: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 1: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +19: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +19: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +28: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +28: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +28: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +28: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +28: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 1: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +28: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +28: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +28: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +20: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +19: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 11:26:39,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +14: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +53: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +53: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +53: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +33: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +33: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +33: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +33: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +53: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +14: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +53: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +53: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +53: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +14: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +43: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +14: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +43: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +38: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +38: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +43: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +53: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +55: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +39: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +39: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +36: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +43: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +55: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +38: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +39: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +55: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +20: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +36: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +36: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +38: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +54: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +54: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +54: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +39: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +40: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +50: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +50: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +33: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +33: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +43: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +32: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +53: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +35: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +20: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +33: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +33: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +56: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +56: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +43: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +43: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +32: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +63: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +32: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +55: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +54: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +42: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +33: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +56: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +36: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +43: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +62: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +62: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +62: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +53: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +53: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +58: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +33: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +33: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +35: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +50: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +48: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +56: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +44: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +60: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +60: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +60: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +32: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +53: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +57: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +57: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +58: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +42: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +42: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +33: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +35: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +62: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +55: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +58: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +44: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +53: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +38: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +44: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +45: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +50: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +53: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +55: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +58: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +48: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +35: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +52: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +52: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +43: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +53: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +59: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +55: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +48: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +42: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +37: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +53: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +38: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +38: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +54: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +47: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +47: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +47: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +52: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +63: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +59: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +55: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +55: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +55: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +38: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +43: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +45: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +45: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +57: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +59: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +55: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +48: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +54: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +52: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +43: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +43: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +38: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +38: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +37: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +39: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +39: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +38: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +54: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +47: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +39: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +36: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +60: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +45: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +50: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +38: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +39: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +33: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +32: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +32: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +32: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +59: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +44: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +36: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +36: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +43: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +43: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +54: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +54: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +39: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +33: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +56: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +36: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +62: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +62: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +39: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +37: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +41: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +40: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +43: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +39: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +33: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +56: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +36: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +36: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +50: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +62: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +32: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +55: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +58: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +39: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +56: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +40: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +43: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +54: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +33: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +36: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +40: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +35: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +35: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +62: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +32: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +56: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +35: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +56: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +62: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +32: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +55: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +56: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +36: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +35: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +35: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +50: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +58: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +58: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +42: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +41: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +62: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +55: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +54: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +35: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +58: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +38: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +42: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +56: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +52: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +52: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +50: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +55: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +58: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +54: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +32: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +32: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +38: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +42: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +42: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +56: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +35: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +62: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +58: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +54: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +52: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +45: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +42: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +59: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +58: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +38: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +42: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +45: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +45: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +35: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +52: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +62: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +45: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +45: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +63: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +57: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +55: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +58: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +54: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +54: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +52: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +45: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +59: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +59: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +42: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +39: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +37: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +60: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +59: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +36: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +36: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +52: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +45: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +32: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +32: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +32: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +48: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +42: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +39: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +56: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +38: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +39: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +36: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +52: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +45: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +62: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +62: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +59: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +48: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +54: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +56: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +44: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +52: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +50: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +62: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +32: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +39: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +56: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +36: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +60: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +59: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +58: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +57: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +56: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +60: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +62: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +59: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +59: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +48: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +40: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +60: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +60: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +60: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +60: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +63: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +35: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +35: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +58: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +42: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +42: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +40: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +35: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +58: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +52: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +52: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +42: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +52: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +58: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +35: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +47: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +37: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +60: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +41: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +41: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +45: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +45: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +45: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +59: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +57: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +42: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +45: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +52: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +60: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +59: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +37: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +59: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +60: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +60: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 11:26:39,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 11:26:39,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +59: [2023-04-29 11:26:39,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 11:26:39,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +60: [2023-04-29 11:26:39,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 11:26:39,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 11:26:39,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 11:26:39,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 11:26:39,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 11:26:39,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 11:26:39,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 11:26:39,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 11:26:39,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 11:26:39,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 11:26:39,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 11:26:39,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... + 4: [2023-04-29 11:26:39,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 4: [2023-04-29 11:26:39,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 4: [2023-04-29 11:26:39,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +28: [2023-04-29 11:26:39,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +28: [2023-04-29 11:26:39,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +28: [2023-04-29 11:26:39,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +28: [2023-04-29 11:26:39,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +28: [2023-04-29 11:26:39,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +28: [2023-04-29 11:26:39,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +28: [2023-04-29 11:26:39,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +28: [2023-04-29 11:26:39,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +28: [2023-04-29 11:26:39,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +28: [2023-04-29 11:26:39,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +28: [2023-04-29 11:26:39,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +28: [2023-04-29 11:26:39,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 4: [2023-04-29 11:26:39,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +28: [2023-04-29 11:26:39,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +28: [2023-04-29 11:26:39,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +28: [2023-04-29 11:26:39,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +28: [2023-04-29 11:26:39,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 4: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 4: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 4: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 3: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 4: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 6: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 6: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 3: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +23: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 3: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +30: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +30: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +30: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 6: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +28: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +23: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 3: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +11: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +13: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +13: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +13: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 6: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +24: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +24: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +28: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +11: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +11: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +24: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +12: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +12: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +12: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +18: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +18: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +18: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 7: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 7: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 7: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +28: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +13: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +15: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +15: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 0: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 0: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 0: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +31: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +23: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +25: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +25: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 7: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +15: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +24: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +31: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +31: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +12: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +30: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 9: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 9: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 9: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +28: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +15: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 8: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 8: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 8: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +25: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 0: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 5: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 5: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 5: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 9: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +11: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +26: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +26: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +18: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +27: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +27: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +27: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 6: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 6: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 8: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +22: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +22: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 3: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +26: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 5: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +16: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +16: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 3: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 3: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 6: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +31: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +23: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +26: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +22: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +30: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +27: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +29: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +29: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +29: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 1: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 1: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +30: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +30: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +11: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 3: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +16: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +13: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +13: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +19: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +19: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +28: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 2: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 2: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 2: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 2: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +23: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +23: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +22: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 6: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +13: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +24: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +24: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +25: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +12: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +28: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +18: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +18: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +24: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 2: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +29: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 1: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 7: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 7: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 7: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +11: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +11: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +12: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +12: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +28: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +16: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +23: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +13: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +18: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +15: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +15: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +17: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 2: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 0: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 0: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 0: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +19: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +24: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +30: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +31: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +25: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +25: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 7: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +15: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +12: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +15: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +28: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +31: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +31: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +25: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +19: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 0: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 8: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 8: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 8: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +11: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +26: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +26: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +18: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +27: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +27: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +10: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 8: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +22: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +22: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +27: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +26: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +16: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +16: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +27: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +14: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +31: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +22: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +14: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +26: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +10: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +10: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +29: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +29: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +16: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +22: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +19: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +19: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +29: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +10: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +29: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +16: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +14: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +19: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +19: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +14: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +28: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +28: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +28: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +21: [2023-04-29 11:26:39,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +61: [2023-04-29 11:26:39,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +21: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +21: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +21: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +21: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +21: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +34: [2023-04-29 11:26:39,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +61: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +61: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +61: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +61: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +61: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +21: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +34: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +34: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +34: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +34: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +34: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +61: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +21: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +34: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +61: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +20: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +21: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +34: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +28: [2023-04-29 11:26:39,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +61: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +21: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +34: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +61: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +21: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +21: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +34: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +34: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +34: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +61: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +61: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +61: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +61: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +21: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +34: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +34: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +34: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +61: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +61: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +21: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +34: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +61: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +21: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +34: [2023-04-29 11:26:39,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +61: [2023-04-29 11:26:39,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +21: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +21: [2023-04-29 11:26:39,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... +34: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +61: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +21: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +34: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +61: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +21: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +34: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +61: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +21: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +34: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +61: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +21: [2023-04-29 11:26:39,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +34: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +34: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +61: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +21: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +34: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +61: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +21: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +21: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +34: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +61: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +21: [2023-04-29 11:26:39,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +34: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +61: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +61: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +21: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +21: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +21: [2023-04-29 11:26:39,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +34: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +34: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +61: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +21: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. +34: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +61: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +21: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +21: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +34: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +14: [2023-04-29 11:26:39,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +14: [2023-04-29 11:26:39,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +61: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +61: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +21: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +34: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +61: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +21: [2023-04-29 11:26:39,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +34: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +61: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +34: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +28: [2023-04-29 11:26:39,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 11:26:39,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 11:26:39,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +28: [2023-04-29 11:26:39,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +28: [2023-04-29 11:26:39,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +10: [2023-04-29 11:26:39,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +28: [2023-04-29 11:26:39,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +10: [2023-04-29 11:26:39,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +10: [2023-04-29 11:26:39,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +14: [2023-04-29 11:26:39,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +10: [2023-04-29 11:26:39,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 11:26:39,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +14: [2023-04-29 11:26:39,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 11:26:39,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 11:26:39,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 2: [2023-04-29 11:26:39,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... + 2: [2023-04-29 11:26:39,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 2: [2023-04-29 11:26:39,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 2: [2023-04-29 11:26:39,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 2: [2023-04-29 11:26:39,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt... + 2: [2023-04-29 11:26:39,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 2: [2023-04-29 11:26:39,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 2: [2023-04-29 11:26:39,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 2: [2023-04-29 11:26:39,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 2: [2023-04-29 11:26:39,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 11:26:39,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +46: [2023-04-29 11:26:39,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt... +46: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +46: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +46: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +46: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +46: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +46: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +46: [2023-04-29 11:26:39,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. + 2: [2023-04-29 11:26:39,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +46: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_00_model_states.pt. +46: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +46: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +46: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +46: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +46: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... +46: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt... + 2: [2023-04-29 11:26:39,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +46: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +46: [2023-04-29 11:26:39,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt... +46: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +46: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +46: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +46: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +46: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +46: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +46: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +46: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +46: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +46: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +46: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +46: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +46: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +46: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +46: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +46: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... + 2: [2023-04-29 11:26:39,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 2: [2023-04-29 11:26:39,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 2: [2023-04-29 11:26:39,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 2: [2023-04-29 11:26:39,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 11:26:39,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 11:26:39,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 11:26:39,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_01_model_states.pt. + 2: [2023-04-29 11:26:39,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +51: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +51: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +51: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +51: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +51: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +51: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +51: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +51: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +51: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +49: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +49: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +49: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +49: [2023-04-29 11:26:39,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_03_model_states.pt. +49: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +49: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +49: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +49: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +49: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +49: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +49: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/mp_rank_02_model_states.pt. +49: [2023-04-29 11:26:39,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +49: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +49: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +49: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +49: [2023-04-29 11:26:39,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +32: [2023-04-29 11:26:40,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +32: [2023-04-29 11:26:40,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +32: [2023-04-29 11:26:40,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +32: [2023-04-29 11:26:40,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +32: [2023-04-29 11:26:40,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +32: [2023-04-29 11:26:40,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +32: [2023-04-29 11:26:40,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +32: [2023-04-29 11:26:40,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 11:26:40,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 11:26:40,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 11:26:40,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 11:26:40,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 11:26:40,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 11:26:40,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 11:26:40,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 11:26:40,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 11:26:40,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... + 5: [2023-04-29 11:26:40,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 5: [2023-04-29 11:26:40,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 5: [2023-04-29 11:26:40,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 5: [2023-04-29 11:26:40,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 5: [2023-04-29 11:26:40,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 5: [2023-04-29 11:26:40,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 5: [2023-04-29 11:26:40,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 5: [2023-04-29 11:26:40,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +32: [2023-04-29 11:26:40,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +39: [2023-04-29 11:26:40,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +39: [2023-04-29 11:26:40,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +39: [2023-04-29 11:26:40,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +39: [2023-04-29 11:26:40,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +39: [2023-04-29 11:26:40,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +39: [2023-04-29 11:26:40,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +39: [2023-04-29 11:26:40,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +54: [2023-04-29 11:26:40,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 11:26:40,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 11:26:40,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 11:26:40,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 11:26:40,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 11:26:40,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 11:26:40,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 11:26:40,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. + 5: [2023-04-29 11:26:40,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 11:26:40,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 11:26:40,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 5: [2023-04-29 11:26:40,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 5: [2023-04-29 11:26:40,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 5: [2023-04-29 11:26:40,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 11:26:40,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 5: [2023-04-29 11:26:40,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +54: [2023-04-29 11:26:40,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +32: [2023-04-29 11:26:40,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +32: [2023-04-29 11:26:40,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +32: [2023-04-29 11:26:40,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +54: [2023-04-29 11:26:40,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +32: [2023-04-29 11:26:40,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +54: [2023-04-29 11:26:40,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +54: [2023-04-29 11:26:40,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +32: [2023-04-29 11:26:40,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +32: [2023-04-29 11:26:40,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +32: [2023-04-29 11:26:40,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... + 4: [2023-04-29 11:26:40,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 4: [2023-04-29 11:26:40,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 4: [2023-04-29 11:26:40,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 4: [2023-04-29 11:26:40,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 4: [2023-04-29 11:26:40,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 4: [2023-04-29 11:26:40,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 4: [2023-04-29 11:26:40,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 4: [2023-04-29 11:26:40,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +61: [2023-04-29 11:26:40,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +61: [2023-04-29 11:26:40,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +61: [2023-04-29 11:26:40,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +61: [2023-04-29 11:26:40,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +61: [2023-04-29 11:26:40,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +61: [2023-04-29 11:26:40,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +61: [2023-04-29 11:26:40,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +61: [2023-04-29 11:26:40,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 11:26:40,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +54: [2023-04-29 11:26:40,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +54: [2023-04-29 11:26:40,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +54: [2023-04-29 11:26:40,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... + 4: [2023-04-29 11:26:40,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 4: [2023-04-29 11:26:40,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 4: [2023-04-29 11:26:40,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 4: [2023-04-29 11:26:40,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +61: [2023-04-29 11:26:40,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +61: [2023-04-29 11:26:40,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +61: [2023-04-29 11:26:40,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +61: [2023-04-29 11:26:40,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +61: [2023-04-29 11:26:40,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +61: [2023-04-29 11:26:40,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +61: [2023-04-29 11:26:40,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... + 4: [2023-04-29 11:26:40,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +61: [2023-04-29 11:26:40,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... + 4: [2023-04-29 11:26:40,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 4: [2023-04-29 11:26:40,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 4: [2023-04-29 11:26:40,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +53: [2023-04-29 11:26:40,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +53: [2023-04-29 11:26:40,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +53: [2023-04-29 11:26:40,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +53: [2023-04-29 11:26:40,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +53: [2023-04-29 11:26:40,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +53: [2023-04-29 11:26:40,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +53: [2023-04-29 11:26:40,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +53: [2023-04-29 11:26:40,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +53: [2023-04-29 11:26:40,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +53: [2023-04-29 11:26:40,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +53: [2023-04-29 11:26:40,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +53: [2023-04-29 11:26:40,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +53: [2023-04-29 11:26:40,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +53: [2023-04-29 11:26:40,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +53: [2023-04-29 11:26:40,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +53: [2023-04-29 11:26:40,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... + 9: [2023-04-29 11:26:40,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 9: [2023-04-29 11:26:40,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 9: [2023-04-29 11:26:40,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 9: [2023-04-29 11:26:40,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 9: [2023-04-29 11:26:40,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 9: [2023-04-29 11:26:40,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 9: [2023-04-29 11:26:40,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 9: [2023-04-29 11:26:40,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 9: [2023-04-29 11:26:40,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 11:26:40,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 9: [2023-04-29 11:26:40,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 9: [2023-04-29 11:26:40,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 11:26:40,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 11:26:40,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 9: [2023-04-29 11:26:40,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 9: [2023-04-29 11:26:40,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +39: [2023-04-29 11:26:40,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 11:26:40,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 11:26:40,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +39: [2023-04-29 11:26:40,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 11:26:40,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. + 5: [2023-04-29 11:26:40,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +60: [2023-04-29 11:26:40,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 11:26:40,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. + 5: [2023-04-29 11:26:40,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +54: [2023-04-29 11:26:40,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 11:26:40,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 11:26:40,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 11:26:40,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 11:26:40,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 11:26:40,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 11:26:40,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 11:26:40,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 11:26:40,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 11:26:40,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 11:26:40,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +19: [2023-04-29 11:26:40,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 11:26:40,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +46: [2023-04-29 11:26:40,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 11:26:40,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 11:26:40,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 11:26:40,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +19: [2023-04-29 11:26:40,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 11:26:40,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 11:26:40,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 11:26:40,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 11:26:40,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 11:26:40,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 4: [2023-04-29 11:26:40,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +39: [2023-04-29 11:26:40,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +23: [2023-04-29 11:26:40,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +23: [2023-04-29 11:26:40,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +23: [2023-04-29 11:26:40,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +23: [2023-04-29 11:26:40,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +23: [2023-04-29 11:26:40,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +23: [2023-04-29 11:26:40,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +23: [2023-04-29 11:26:40,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +23: [2023-04-29 11:26:40,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +60: [2023-04-29 11:26:40,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +32: [2023-04-29 11:26:40,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +32: [2023-04-29 11:26:40,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +32: [2023-04-29 11:26:40,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +32: [2023-04-29 11:26:40,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 11:26:40,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +46: [2023-04-29 11:26:40,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +26: [2023-04-29 11:26:40,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 11:26:40,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +54: [2023-04-29 11:26:40,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +54: [2023-04-29 11:26:40,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. + 5: [2023-04-29 11:26:40,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 11:26:40,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 11:26:40,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 11:26:40,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 11:26:40,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 11:26:40,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 11:26:40,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +46: [2023-04-29 11:26:40,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... + 5: [2023-04-29 11:26:40,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 11:26:40,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 11:26:40,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +60: [2023-04-29 11:26:40,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +60: [2023-04-29 11:26:40,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +15: [2023-04-29 11:26:40,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 11:26:40,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 11:26:40,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 11:26:40,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 11:26:40,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +60: [2023-04-29 11:26:40,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... + 8: [2023-04-29 11:26:40,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 8: [2023-04-29 11:26:40,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 8: [2023-04-29 11:26:40,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 8: [2023-04-29 11:26:40,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 8: [2023-04-29 11:26:40,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 8: [2023-04-29 11:26:40,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 8: [2023-04-29 11:26:40,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 11:26:40,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +60: [2023-04-29 11:26:40,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... + 8: [2023-04-29 11:26:40,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +46: [2023-04-29 11:26:40,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +46: [2023-04-29 11:26:40,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +19: [2023-04-29 11:26:40,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +61: [2023-04-29 11:26:40,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +61: [2023-04-29 11:26:40,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +19: [2023-04-29 11:26:40,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +19: [2023-04-29 11:26:40,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 4: [2023-04-29 11:26:40,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +39: [2023-04-29 11:26:40,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +19: [2023-04-29 11:26:40,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +60: [2023-04-29 11:26:40,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +46: [2023-04-29 11:26:40,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +27: [2023-04-29 11:26:40,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +27: [2023-04-29 11:26:40,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +31: [2023-04-29 11:26:40,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +31: [2023-04-29 11:26:40,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +31: [2023-04-29 11:26:40,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +31: [2023-04-29 11:26:40,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +31: [2023-04-29 11:26:40,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +46: [2023-04-29 11:26:40,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +31: [2023-04-29 11:26:40,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +31: [2023-04-29 11:26:40,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +31: [2023-04-29 11:26:40,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +46: [2023-04-29 11:26:40,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +46: [2023-04-29 11:26:40,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +27: [2023-04-29 11:26:40,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +27: [2023-04-29 11:26:40,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +27: [2023-04-29 11:26:40,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +27: [2023-04-29 11:26:40,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +27: [2023-04-29 11:26:40,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +27: [2023-04-29 11:26:40,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 11:26:40,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 3: [2023-04-29 11:26:40,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 3: [2023-04-29 11:26:40,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 3: [2023-04-29 11:26:40,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 3: [2023-04-29 11:26:40,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 3: [2023-04-29 11:26:40,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 3: [2023-04-29 11:26:40,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 3: [2023-04-29 11:26:40,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 11:26:40,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 3: [2023-04-29 11:26:40,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +60: [2023-04-29 11:26:40,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +23: [2023-04-29 11:26:40,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +19: [2023-04-29 11:26:40,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +19: [2023-04-29 11:26:40,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +23: [2023-04-29 11:26:40,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +23: [2023-04-29 11:26:40,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +23: [2023-04-29 11:26:40,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +23: [2023-04-29 11:26:40,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +13: [2023-04-29 11:26:40,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +13: [2023-04-29 11:26:40,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +13: [2023-04-29 11:26:40,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +13: [2023-04-29 11:26:40,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +13: [2023-04-29 11:26:40,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +13: [2023-04-29 11:26:40,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +13: [2023-04-29 11:26:40,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 6: [2023-04-29 11:26:40,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 6: [2023-04-29 11:26:40,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 6: [2023-04-29 11:26:40,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 6: [2023-04-29 11:26:40,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 6: [2023-04-29 11:26:40,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 6: [2023-04-29 11:26:40,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 6: [2023-04-29 11:26:40,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 6: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +13: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +26: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +30: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +61: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +26: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +61: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +24: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +24: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +24: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +24: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +24: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +24: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +24: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +24: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +23: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 11:26:40,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 8: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +39: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +17: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +39: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +11: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +15: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 8: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +11: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +22: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +22: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +22: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +22: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +22: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +22: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +22: [2023-04-29 11:26:40,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +22: [2023-04-29 11:26:40,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +23: [2023-04-29 11:26:40,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +23: [2023-04-29 11:26:40,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +54: [2023-04-29 11:26:40,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +15: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +25: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +25: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +31: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +16: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +25: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +25: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +25: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +25: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +25: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 4: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +21: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 11:26:40,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +25: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +31: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +15: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +31: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +27: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +26: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +27: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +15: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +31: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 3: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 7: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +27: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +15: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 7: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +26: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +15: [2023-04-29 11:26:40,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 3: [2023-04-29 11:26:40,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +26: [2023-04-29 11:26:40,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +27: [2023-04-29 11:26:40,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 3: [2023-04-29 11:26:40,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +31: [2023-04-29 11:26:40,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +27: [2023-04-29 11:26:40,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +27: [2023-04-29 11:26:40,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +27: [2023-04-29 11:26:40,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +27: [2023-04-29 11:26:40,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 8: [2023-04-29 11:26:40,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +12: [2023-04-29 11:26:40,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +12: [2023-04-29 11:26:40,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +12: [2023-04-29 11:26:40,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +12: [2023-04-29 11:26:40,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +12: [2023-04-29 11:26:40,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 8: [2023-04-29 11:26:40,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +12: [2023-04-29 11:26:40,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +12: [2023-04-29 11:26:40,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +12: [2023-04-29 11:26:40,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +31: [2023-04-29 11:26:40,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 8: [2023-04-29 11:26:40,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 8: [2023-04-29 11:26:40,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +31: [2023-04-29 11:26:40,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 4: [2023-04-29 11:26:40,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +24: [2023-04-29 11:26:40,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 8: [2023-04-29 11:26:40,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +31: [2023-04-29 11:26:40,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +24: [2023-04-29 11:26:40,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +54: [2023-04-29 11:26:40,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +24: [2023-04-29 11:26:40,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 8: [2023-04-29 11:26:40,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +30: [2023-04-29 11:26:40,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +13: [2023-04-29 11:26:40,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +13: [2023-04-29 11:26:40,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 3: [2023-04-29 11:26:40,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +30: [2023-04-29 11:26:40,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +30: [2023-04-29 11:26:40,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +30: [2023-04-29 11:26:40,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +13: [2023-04-29 11:26:40,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 6: [2023-04-29 11:26:40,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 3: [2023-04-29 11:26:40,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 6: [2023-04-29 11:26:40,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 6: [2023-04-29 11:26:40,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +13: [2023-04-29 11:26:40,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 11:26:40,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 5: [2023-04-29 11:26:40,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +30: [2023-04-29 11:26:40,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 6: [2023-04-29 11:26:40,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 3: [2023-04-29 11:26:40,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +13: [2023-04-29 11:26:40,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +13: [2023-04-29 11:26:40,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +13: [2023-04-29 11:26:40,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +13: [2023-04-29 11:26:40,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 6: [2023-04-29 11:26:40,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 6: [2023-04-29 11:26:40,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 6: [2023-04-29 11:26:40,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 6: [2023-04-29 11:26:40,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 3: [2023-04-29 11:26:40,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +11: [2023-04-29 11:26:40,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +30: [2023-04-29 11:26:40,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +30: [2023-04-29 11:26:40,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +16: [2023-04-29 11:26:40,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +30: [2023-04-29 11:26:40,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +11: [2023-04-29 11:26:40,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +22: [2023-04-29 11:26:40,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +24: [2023-04-29 11:26:40,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +22: [2023-04-29 11:26:40,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +22: [2023-04-29 11:26:40,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +21: [2023-04-29 11:26:40,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +25: [2023-04-29 11:26:40,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +24: [2023-04-29 11:26:40,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +24: [2023-04-29 11:26:40,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +21: [2023-04-29 11:26:40,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +25: [2023-04-29 11:26:40,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +24: [2023-04-29 11:26:40,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +21: [2023-04-29 11:26:40,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +25: [2023-04-29 11:26:40,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 11:26:40,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +24: [2023-04-29 11:26:40,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 7: [2023-04-29 11:26:40,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +21: [2023-04-29 11:26:40,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +25: [2023-04-29 11:26:40,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 3: [2023-04-29 11:26:40,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +25: [2023-04-29 11:26:40,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +17: [2023-04-29 11:26:40,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +21: [2023-04-29 11:26:40,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 11:26:40,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +25: [2023-04-29 11:26:40,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +25: [2023-04-29 11:26:40,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 7: [2023-04-29 11:26:40,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +12: [2023-04-29 11:26:40,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 7: [2023-04-29 11:26:40,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +25: [2023-04-29 11:26:40,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +12: [2023-04-29 11:26:40,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +12: [2023-04-29 11:26:40,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +12: [2023-04-29 11:26:40,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +21: [2023-04-29 11:26:40,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +12: [2023-04-29 11:26:40,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 4: [2023-04-29 11:26:40,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +12: [2023-04-29 11:26:40,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +12: [2023-04-29 11:26:40,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +16: [2023-04-29 11:26:40,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +16: [2023-04-29 11:26:40,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +12: [2023-04-29 11:26:40,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +16: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +16: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +51: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +22: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +51: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +29: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +29: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +22: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +16: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +51: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +51: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +51: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +51: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +51: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +21: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +54: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +54: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +22: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +18: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +18: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +29: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +29: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +29: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +29: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +29: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +51: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +18: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +18: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +18: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +18: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +18: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +29: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 11:26:40,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +18: [2023-04-29 11:26:40,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 11:26:40,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +17: [2023-04-29 11:26:40,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +22: [2023-04-29 11:26:40,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +22: [2023-04-29 11:26:40,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 7: [2023-04-29 11:26:40,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 11:26:40,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 4: [2023-04-29 11:26:40,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 7: [2023-04-29 11:26:40,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 7: [2023-04-29 11:26:40,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 7: [2023-04-29 11:26:40,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +17: [2023-04-29 11:26:40,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 7: [2023-04-29 11:26:40,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +17: [2023-04-29 11:26:40,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +10: [2023-04-29 11:26:40,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +10: [2023-04-29 11:26:40,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +10: [2023-04-29 11:26:40,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +10: [2023-04-29 11:26:40,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +10: [2023-04-29 11:26:40,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 11:26:40,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +10: [2023-04-29 11:26:40,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +10: [2023-04-29 11:26:40,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +10: [2023-04-29 11:26:40,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +53: [2023-04-29 11:26:40,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +53: [2023-04-29 11:26:40,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +17: [2023-04-29 11:26:40,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +11: [2023-04-29 11:26:40,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +11: [2023-04-29 11:26:40,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +11: [2023-04-29 11:26:40,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 11:26:40,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +29: [2023-04-29 11:26:40,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 5: [2023-04-29 11:26:40,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +11: [2023-04-29 11:26:40,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +29: [2023-04-29 11:26:40,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +18: [2023-04-29 11:26:40,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +51: [2023-04-29 11:26:40,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +51: [2023-04-29 11:26:40,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +51: [2023-04-29 11:26:40,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +61: [2023-04-29 11:26:40,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +18: [2023-04-29 11:26:40,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +11: [2023-04-29 11:26:40,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +61: [2023-04-29 11:26:40,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +51: [2023-04-29 11:26:40,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 11:26:40,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +51: [2023-04-29 11:26:40,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +51: [2023-04-29 11:26:40,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +51: [2023-04-29 11:26:40,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +18: [2023-04-29 11:26:40,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +53: [2023-04-29 11:26:40,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +53: [2023-04-29 11:26:40,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +18: [2023-04-29 11:26:40,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +61: [2023-04-29 11:26:40,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +29: [2023-04-29 11:26:40,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 2: [2023-04-29 11:26:40,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 2: [2023-04-29 11:26:40,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 2: [2023-04-29 11:26:40,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 2: [2023-04-29 11:26:40,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 2: [2023-04-29 11:26:40,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 2: [2023-04-29 11:26:40,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 2: [2023-04-29 11:26:40,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 2: [2023-04-29 11:26:40,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +29: [2023-04-29 11:26:40,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +18: [2023-04-29 11:26:40,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +18: [2023-04-29 11:26:40,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +32: [2023-04-29 11:26:40,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +18: [2023-04-29 11:26:40,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 4: [2023-04-29 11:26:40,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +18: [2023-04-29 11:26:40,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +61: [2023-04-29 11:26:40,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 0: [2023-04-29 11:26:40,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 9: [2023-04-29 11:26:40,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 0: [2023-04-29 11:26:40,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +10: [2023-04-29 11:26:40,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 0: [2023-04-29 11:26:40,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 0: [2023-04-29 11:26:40,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 0: [2023-04-29 11:26:40,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 0: [2023-04-29 11:26:40,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 0: [2023-04-29 11:26:40,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 0: [2023-04-29 11:26:40,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +10: [2023-04-29 11:26:40,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +29: [2023-04-29 11:26:40,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +32: [2023-04-29 11:26:40,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 1: [2023-04-29 11:26:40,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 1: [2023-04-29 11:26:40,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 1: [2023-04-29 11:26:40,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 1: [2023-04-29 11:26:40,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 1: [2023-04-29 11:26:40,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 1: [2023-04-29 11:26:40,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 1: [2023-04-29 11:26:40,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 1: [2023-04-29 11:26:40,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 4: [2023-04-29 11:26:40,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +29: [2023-04-29 11:26:40,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 11:26:40,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +14: [2023-04-29 11:26:40,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 11:26:40,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 11:26:40,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 11:26:40,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 11:26:40,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 11:26:40,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 11:26:40,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 11:26:40,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 2: [2023-04-29 11:26:40,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +29: [2023-04-29 11:26:40,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +29: [2023-04-29 11:26:40,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +32: [2023-04-29 11:26:40,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +32: [2023-04-29 11:26:40,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +10: [2023-04-29 11:26:40,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 11:26:40,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +20: [2023-04-29 11:26:40,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +20: [2023-04-29 11:26:40,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +20: [2023-04-29 11:26:40,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +20: [2023-04-29 11:26:40,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +20: [2023-04-29 11:26:40,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +20: [2023-04-29 11:26:40,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +20: [2023-04-29 11:26:40,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 0: [2023-04-29 11:26:40,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 11:26:40,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 2: [2023-04-29 11:26:40,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +10: [2023-04-29 11:26:40,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 11:26:40,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 2: [2023-04-29 11:26:40,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 2: [2023-04-29 11:26:40,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 2: [2023-04-29 11:26:40,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 9: [2023-04-29 11:26:40,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 2: [2023-04-29 11:26:40,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 9: [2023-04-29 11:26:40,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 0: [2023-04-29 11:26:40,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +10: [2023-04-29 11:26:40,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 0: [2023-04-29 11:26:40,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +10: [2023-04-29 11:26:40,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 1: [2023-04-29 11:26:40,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +10: [2023-04-29 11:26:40,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 1: [2023-04-29 11:26:40,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +14: [2023-04-29 11:26:40,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +14: [2023-04-29 11:26:40,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +14: [2023-04-29 11:26:40,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 1: [2023-04-29 11:26:40,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 0: [2023-04-29 11:26:40,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 1: [2023-04-29 11:26:40,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 11:26:40,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 0: [2023-04-29 11:26:40,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 0: [2023-04-29 11:26:40,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 0: [2023-04-29 11:26:40,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 0: [2023-04-29 11:26:40,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +10: [2023-04-29 11:26:40,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 11:26:40,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 11:26:40,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 1: [2023-04-29 11:26:40,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 11:26:40,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 1: [2023-04-29 11:26:40,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +20: [2023-04-29 11:26:40,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 1: [2023-04-29 11:26:40,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +14: [2023-04-29 11:26:40,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +14: [2023-04-29 11:26:40,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +14: [2023-04-29 11:26:40,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +53: [2023-04-29 11:26:40,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +53: [2023-04-29 11:26:40,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +14: [2023-04-29 11:26:40,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 11:26:40,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +53: [2023-04-29 11:26:40,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +53: [2023-04-29 11:26:40,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +20: [2023-04-29 11:26:40,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +14: [2023-04-29 11:26:40,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +20: [2023-04-29 11:26:40,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +20: [2023-04-29 11:26:40,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... + 9: [2023-04-29 11:26:40,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +46: [2023-04-29 11:26:40,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +50: [2023-04-29 11:26:40,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +50: [2023-04-29 11:26:40,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +62: [2023-04-29 11:26:40,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +62: [2023-04-29 11:26:40,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +50: [2023-04-29 11:26:40,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +50: [2023-04-29 11:26:40,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +50: [2023-04-29 11:26:40,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +50: [2023-04-29 11:26:40,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +50: [2023-04-29 11:26:40,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +62: [2023-04-29 11:26:40,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +62: [2023-04-29 11:26:40,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +50: [2023-04-29 11:26:40,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +62: [2023-04-29 11:26:40,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +62: [2023-04-29 11:26:40,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +62: [2023-04-29 11:26:40,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +62: [2023-04-29 11:26:40,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. + 9: [2023-04-29 11:26:40,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +60: [2023-04-29 11:26:40,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. + 9: [2023-04-29 11:26:40,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 9: [2023-04-29 11:26:40,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +46: [2023-04-29 11:26:40,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +19: [2023-04-29 11:26:40,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +50: [2023-04-29 11:26:40,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +50: [2023-04-29 11:26:40,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +62: [2023-04-29 11:26:40,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +62: [2023-04-29 11:26:40,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +62: [2023-04-29 11:26:40,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +62: [2023-04-29 11:26:40,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +62: [2023-04-29 11:26:40,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +60: [2023-04-29 11:26:40,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +50: [2023-04-29 11:26:40,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +50: [2023-04-29 11:26:40,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +19: [2023-04-29 11:26:40,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +62: [2023-04-29 11:26:40,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +62: [2023-04-29 11:26:40,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +23: [2023-04-29 11:26:40,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +50: [2023-04-29 11:26:40,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 11:26:40,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +62: [2023-04-29 11:26:40,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +50: [2023-04-29 11:26:40,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... + 8: [2023-04-29 11:26:40,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +50: [2023-04-29 11:26:40,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +60: [2023-04-29 11:26:40,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 11:26:40,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +46: [2023-04-29 11:26:40,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +19: [2023-04-29 11:26:40,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 11:26:40,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 3: [2023-04-29 11:26:40,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 11:26:40,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 11:26:40,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +60: [2023-04-29 11:26:40,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +16: [2023-04-29 11:26:40,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 11:26:40,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +13: [2023-04-29 11:26:40,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 11:26:40,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 11:26:40,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +25: [2023-04-29 11:26:40,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 11:26:40,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +24: [2023-04-29 11:26:40,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +24: [2023-04-29 11:26:40,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 11:26:40,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +22: [2023-04-29 11:26:40,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 3: [2023-04-29 11:26:40,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 11:26:40,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 11:26:40,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +23: [2023-04-29 11:26:40,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +23: [2023-04-29 11:26:40,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 11:26:40,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 11:26:40,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 6: [2023-04-29 11:26:40,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 11:26:40,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +23: [2023-04-29 11:26:40,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 11:26:40,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +31: [2023-04-29 11:26:40,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +31: [2023-04-29 11:26:40,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +31: [2023-04-29 11:26:40,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 11:26:40,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 11:26:40,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 11:26:40,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 11:26:40,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 11:26:40,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 11:26:40,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 11:26:40,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 11:26:40,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +46: [2023-04-29 11:26:40,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +31: [2023-04-29 11:26:40,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +27: [2023-04-29 11:26:40,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +27: [2023-04-29 11:26:40,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +27: [2023-04-29 11:26:40,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 6: [2023-04-29 11:26:40,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +27: [2023-04-29 11:26:40,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 6: [2023-04-29 11:26:40,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 6: [2023-04-29 11:26:40,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +60: [2023-04-29 11:26:40,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +12: [2023-04-29 11:26:40,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +12: [2023-04-29 11:26:40,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +24: [2023-04-29 11:26:40,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 3: [2023-04-29 11:26:40,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +24: [2023-04-29 11:26:40,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 8: [2023-04-29 11:26:40,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 8: [2023-04-29 11:26:40,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 8: [2023-04-29 11:26:40,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +46: [2023-04-29 11:26:40,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +16: [2023-04-29 11:26:40,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +13: [2023-04-29 11:26:40,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +13: [2023-04-29 11:26:40,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +13: [2023-04-29 11:26:40,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 3: [2023-04-29 11:26:40,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 11:26:40,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +25: [2023-04-29 11:26:40,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +25: [2023-04-29 11:26:40,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +25: [2023-04-29 11:26:40,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 11:26:40,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +30: [2023-04-29 11:26:40,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 11:26:40,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 11:26:40,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 11:26:40,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 11:26:40,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +21: [2023-04-29 11:26:40,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 11:26:40,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +28: [2023-04-29 11:26:40,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +28: [2023-04-29 11:26:40,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +60: [2023-04-29 11:26:40,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +19: [2023-04-29 11:26:40,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +18: [2023-04-29 11:26:40,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +23: [2023-04-29 11:26:40,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +12: [2023-04-29 11:26:40,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +12: [2023-04-29 11:26:40,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +51: [2023-04-29 11:26:40,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +22: [2023-04-29 11:26:40,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +22: [2023-04-29 11:26:40,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +46: [2023-04-29 11:26:40,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +46: [2023-04-29 11:26:40,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +34: [2023-04-29 11:26:40,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +34: [2023-04-29 11:26:40,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +34: [2023-04-29 11:26:40,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +34: [2023-04-29 11:26:40,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +34: [2023-04-29 11:26:40,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +34: [2023-04-29 11:26:40,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +34: [2023-04-29 11:26:40,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 11:26:40,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +34: [2023-04-29 11:26:40,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. + 8: [2023-04-29 11:26:40,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +18: [2023-04-29 11:26:40,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 3: [2023-04-29 11:26:40,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +28: [2023-04-29 11:26:40,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... +28: [2023-04-29 11:26:40,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +28: [2023-04-29 11:26:40,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt... +28: [2023-04-29 11:26:40,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt... + 7: [2023-04-29 11:26:40,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 11:26:40,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +17: [2023-04-29 11:26:40,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 11:26:40,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +11: [2023-04-29 11:26:40,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 11:26:40,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 11:26:40,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +19: [2023-04-29 11:26:40,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +19: [2023-04-29 11:26:40,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +51: [2023-04-29 11:26:40,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +51: [2023-04-29 11:26:40,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +16: [2023-04-29 11:26:40,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 11:26:40,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 2: [2023-04-29 11:26:40,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +15: [2023-04-29 11:26:40,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +15: [2023-04-29 11:26:40,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +52: [2023-04-29 11:26:40,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +52: [2023-04-29 11:26:40,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +52: [2023-04-29 11:26:40,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +52: [2023-04-29 11:26:40,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +52: [2023-04-29 11:26:40,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +52: [2023-04-29 11:26:40,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +52: [2023-04-29 11:26:40,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +60: [2023-04-29 11:26:40,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +52: [2023-04-29 11:26:40,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +51: [2023-04-29 11:26:40,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +22: [2023-04-29 11:26:40,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +29: [2023-04-29 11:26:40,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +29: [2023-04-29 11:26:40,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +22: [2023-04-29 11:26:40,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +34: [2023-04-29 11:26:40,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +18: [2023-04-29 11:26:40,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 11:26:40,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +18: [2023-04-29 11:26:40,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +34: [2023-04-29 11:26:40,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +34: [2023-04-29 11:26:40,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +21: [2023-04-29 11:26:40,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 11:26:40,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +10: [2023-04-29 11:26:40,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +26: [2023-04-29 11:26:40,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +11: [2023-04-29 11:26:40,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +13: [2023-04-29 11:26:40,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 11:26:40,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +26: [2023-04-29 11:26:40,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +25: [2023-04-29 11:26:40,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 2: [2023-04-29 11:26:40,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 7: [2023-04-29 11:26:40,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +15: [2023-04-29 11:26:40,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +15: [2023-04-29 11:26:40,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 3: [2023-04-29 11:26:40,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +52: [2023-04-29 11:26:40,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +17: [2023-04-29 11:26:40,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +52: [2023-04-29 11:26:40,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +17: [2023-04-29 11:26:40,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +34: [2023-04-29 11:26:40,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +26: [2023-04-29 11:26:40,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +23: [2023-04-29 11:26:40,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +34: [2023-04-29 11:26:40,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +23: [2023-04-29 11:26:40,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +30: [2023-04-29 11:26:40,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +52: [2023-04-29 11:26:40,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +52: [2023-04-29 11:26:40,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... + 6: [2023-04-29 11:26:40,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +31: [2023-04-29 11:26:40,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +26: [2023-04-29 11:26:40,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +34: [2023-04-29 11:26:40,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... + 6: [2023-04-29 11:26:40,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 2: [2023-04-29 11:26:40,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +27: [2023-04-29 11:26:40,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +52: [2023-04-29 11:26:40,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +23: [2023-04-29 11:26:40,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +52: [2023-04-29 11:26:40,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... + 6: [2023-04-29 11:26:40,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 11:26:40,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 11:26:40,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +34: [2023-04-29 11:26:40,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +52: [2023-04-29 11:26:40,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... + 0: [2023-04-29 11:26:40,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +31: [2023-04-29 11:26:40,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +31: [2023-04-29 11:26:40,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +34: [2023-04-29 11:26:40,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +52: [2023-04-29 11:26:40,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +16: [2023-04-29 11:26:40,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +31: [2023-04-29 11:26:40,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +17: [2023-04-29 11:26:40,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +12: [2023-04-29 11:26:40,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +12: [2023-04-29 11:26:40,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +13: [2023-04-29 11:26:40,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 8: [2023-04-29 11:26:40,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +29: [2023-04-29 11:26:40,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 6: [2023-04-29 11:26:40,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +20: [2023-04-29 11:26:40,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 8: [2023-04-29 11:26:40,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +59: [2023-04-29 11:26:40,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 11:26:40,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 11:26:40,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. + 2: [2023-04-29 11:26:40,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +59: [2023-04-29 11:26:40,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 11:26:40,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 11:26:40,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 11:26:40,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. + 8: [2023-04-29 11:26:40,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +59: [2023-04-29 11:26:40,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. + 0: [2023-04-29 11:26:40,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +30: [2023-04-29 11:26:40,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 1: [2023-04-29 11:26:40,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 1: [2023-04-29 11:26:40,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 1: [2023-04-29 11:26:40,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +20: [2023-04-29 11:26:40,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +29: [2023-04-29 11:26:40,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +18: [2023-04-29 11:26:40,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +25: [2023-04-29 11:26:40,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +27: [2023-04-29 11:26:40,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +25: [2023-04-29 11:26:40,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +13: [2023-04-29 11:26:40,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +25: [2023-04-29 11:26:40,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +13: [2023-04-29 11:26:40,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +30: [2023-04-29 11:26:40,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +12: [2023-04-29 11:26:40,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +12: [2023-04-29 11:26:40,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +30: [2023-04-29 11:26:40,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 1: [2023-04-29 11:26:40,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 3: [2023-04-29 11:26:40,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 3: [2023-04-29 11:26:40,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +21: [2023-04-29 11:26:40,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +27: [2023-04-29 11:26:40,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +27: [2023-04-29 11:26:40,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +22: [2023-04-29 11:26:40,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +21: [2023-04-29 11:26:40,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +21: [2023-04-29 11:26:40,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +51: [2023-04-29 11:26:40,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +38: [2023-04-29 11:26:40,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +38: [2023-04-29 11:26:40,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +38: [2023-04-29 11:26:40,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +38: [2023-04-29 11:26:40,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +38: [2023-04-29 11:26:40,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +38: [2023-04-29 11:26:40,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +38: [2023-04-29 11:26:40,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +38: [2023-04-29 11:26:40,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +10: [2023-04-29 11:26:40,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 0: [2023-04-29 11:26:40,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. + 0: [2023-04-29 11:26:40,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +18: [2023-04-29 11:26:40,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 2: [2023-04-29 11:26:40,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 7: [2023-04-29 11:26:40,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +59: [2023-04-29 11:26:40,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +59: [2023-04-29 11:26:40,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +59: [2023-04-29 11:26:40,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +22: [2023-04-29 11:26:40,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 7: [2023-04-29 11:26:40,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +14: [2023-04-29 11:26:40,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +14: [2023-04-29 11:26:40,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +38: [2023-04-29 11:26:40,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +14: [2023-04-29 11:26:40,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +18: [2023-04-29 11:26:40,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 7: [2023-04-29 11:26:40,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 2: [2023-04-29 11:26:40,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +11: [2023-04-29 11:26:40,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +18: [2023-04-29 11:26:40,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +17: [2023-04-29 11:26:40,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +51: [2023-04-29 11:26:40,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +20: [2023-04-29 11:26:40,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +20: [2023-04-29 11:26:40,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +16: [2023-04-29 11:26:40,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +16: [2023-04-29 11:26:40,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +10: [2023-04-29 11:26:40,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +51: [2023-04-29 11:26:40,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +57: [2023-04-29 11:26:40,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +11: [2023-04-29 11:26:40,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +38: [2023-04-29 11:26:40,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +38: [2023-04-29 11:26:40,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +38: [2023-04-29 11:26:40,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 11:26:40,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 11:26:40,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 11:26:40,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 11:26:40,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 11:26:40,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 11:26:40,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +51: [2023-04-29 11:26:40,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +38: [2023-04-29 11:26:40,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +38: [2023-04-29 11:26:40,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +38: [2023-04-29 11:26:40,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +38: [2023-04-29 11:26:40,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +10: [2023-04-29 11:26:40,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +57: [2023-04-29 11:26:40,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +22: [2023-04-29 11:26:40,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +14: [2023-04-29 11:26:40,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +11: [2023-04-29 11:26:40,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +59: [2023-04-29 11:26:40,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +59: [2023-04-29 11:26:40,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +62: [2023-04-29 11:26:40,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 11:26:40,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... + 2: [2023-04-29 11:26:40,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 0: [2023-04-29 11:26:40,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +43: [2023-04-29 11:26:40,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +43: [2023-04-29 11:26:40,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 11:26:40,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +59: [2023-04-29 11:26:40,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +57: [2023-04-29 11:26:40,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +57: [2023-04-29 11:26:40,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +57: [2023-04-29 11:26:40,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... + 2: [2023-04-29 11:26:40,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +56: [2023-04-29 11:26:40,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 11:26:40,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 11:26:40,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 11:26:40,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. + 0: [2023-04-29 11:26:40,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +57: [2023-04-29 11:26:40,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +29: [2023-04-29 11:26:40,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +33: [2023-04-29 11:26:40,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 11:26:40,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +43: [2023-04-29 11:26:40,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 11:26:40,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 11:26:40,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 11:26:40,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +43: [2023-04-29 11:26:40,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +43: [2023-04-29 11:26:40,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 11:26:40,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +43: [2023-04-29 11:26:40,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +43: [2023-04-29 11:26:40,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +43: [2023-04-29 11:26:40,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +17: [2023-04-29 11:26:40,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +57: [2023-04-29 11:26:40,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 11:26:40,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +20: [2023-04-29 11:26:40,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +57: [2023-04-29 11:26:40,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +29: [2023-04-29 11:26:40,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +56: [2023-04-29 11:26:40,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +35: [2023-04-29 11:26:40,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +35: [2023-04-29 11:26:40,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +35: [2023-04-29 11:26:40,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +35: [2023-04-29 11:26:40,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 11:26:40,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +56: [2023-04-29 11:26:40,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. + 1: [2023-04-29 11:26:40,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +35: [2023-04-29 11:26:40,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +35: [2023-04-29 11:26:40,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +35: [2023-04-29 11:26:40,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 11:26:40,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 11:26:40,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 11:26:40,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +35: [2023-04-29 11:26:40,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 11:26:40,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 11:26:40,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 11:26:40,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +62: [2023-04-29 11:26:40,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. + 1: [2023-04-29 11:26:40,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +62: [2023-04-29 11:26:40,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +62: [2023-04-29 11:26:40,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. + 1: [2023-04-29 11:26:40,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +43: [2023-04-29 11:26:40,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +43: [2023-04-29 11:26:40,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... + 1: [2023-04-29 11:26:40,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +63: [2023-04-29 11:26:40,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 11:26:40,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 11:26:40,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 11:26:40,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 11:26:40,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 11:26:40,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +20: [2023-04-29 11:26:40,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +33: [2023-04-29 11:26:40,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 11:26:40,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 11:26:40,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 11:26:40,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 11:26:40,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 11:26:40,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 11:26:40,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 11:26:40,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +17: [2023-04-29 11:26:40,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +48: [2023-04-29 11:26:40,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +43: [2023-04-29 11:26:40,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +43: [2023-04-29 11:26:40,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +43: [2023-04-29 11:26:40,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +43: [2023-04-29 11:26:40,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +43: [2023-04-29 11:26:40,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +56: [2023-04-29 11:26:40,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +56: [2023-04-29 11:26:40,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +33: [2023-04-29 11:26:40,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +33: [2023-04-29 11:26:40,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +43: [2023-04-29 11:26:40,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +33: [2023-04-29 11:26:40,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +33: [2023-04-29 11:26:40,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +50: [2023-04-29 11:26:40,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +50: [2023-04-29 11:26:40,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +50: [2023-04-29 11:26:40,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 11:26:40,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +10: [2023-04-29 11:26:40,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +56: [2023-04-29 11:26:40,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +36: [2023-04-29 11:26:40,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +36: [2023-04-29 11:26:40,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +36: [2023-04-29 11:26:40,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +36: [2023-04-29 11:26:40,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +36: [2023-04-29 11:26:40,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +36: [2023-04-29 11:26:40,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +36: [2023-04-29 11:26:40,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. + 0: [2023-04-29 11:26:40,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +33: [2023-04-29 11:26:40,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +36: [2023-04-29 11:26:40,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 11:26:40,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... + 0: [2023-04-29 11:26:40,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +55: [2023-04-29 11:26:40,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +55: [2023-04-29 11:26:40,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 11:26:40,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +35: [2023-04-29 11:26:40,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +35: [2023-04-29 11:26:40,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +35: [2023-04-29 11:26:40,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +55: [2023-04-29 11:26:40,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +55: [2023-04-29 11:26:40,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +35: [2023-04-29 11:26:40,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +55: [2023-04-29 11:26:40,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +55: [2023-04-29 11:26:40,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +55: [2023-04-29 11:26:40,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +55: [2023-04-29 11:26:40,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 11:26:40,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 11:26:40,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 11:26:40,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 11:26:40,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 11:26:40,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 11:26:40,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +41: [2023-04-29 11:26:40,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +35: [2023-04-29 11:26:40,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 11:26:40,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 11:26:40,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 11:26:40,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 11:26:40,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 11:26:40,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +35: [2023-04-29 11:26:40,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +63: [2023-04-29 11:26:40,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 11:26:40,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +41: [2023-04-29 11:26:40,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 11:26:40,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +48: [2023-04-29 11:26:40,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 11:26:40,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +50: [2023-04-29 11:26:40,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 11:26:40,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 11:26:40,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +10: [2023-04-29 11:26:40,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +48: [2023-04-29 11:26:40,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +56: [2023-04-29 11:26:40,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 11:26:40,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +40: [2023-04-29 11:26:40,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 11:26:40,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +29: [2023-04-29 11:26:40,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +29: [2023-04-29 11:26:40,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +35: [2023-04-29 11:26:40,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 11:26:40,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +35: [2023-04-29 11:26:40,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 11:26:40,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +36: [2023-04-29 11:26:40,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +36: [2023-04-29 11:26:40,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +40: [2023-04-29 11:26:40,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +36: [2023-04-29 11:26:40,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +36: [2023-04-29 11:26:40,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +40: [2023-04-29 11:26:40,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +40: [2023-04-29 11:26:40,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +40: [2023-04-29 11:26:40,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +40: [2023-04-29 11:26:40,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 11:26:40,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +48: [2023-04-29 11:26:40,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 11:26:40,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +55: [2023-04-29 11:26:40,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +56: [2023-04-29 11:26:40,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +40: [2023-04-29 11:26:40,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 11:26:40,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +20: [2023-04-29 11:26:40,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +36: [2023-04-29 11:26:40,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +36: [2023-04-29 11:26:40,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 11:26:40,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 11:26:40,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +20: [2023-04-29 11:26:40,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +36: [2023-04-29 11:26:40,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 11:26:40,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 11:26:40,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 11:26:40,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 11:26:40,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +36: [2023-04-29 11:26:40,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +55: [2023-04-29 11:26:40,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +55: [2023-04-29 11:26:40,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 11:26:40,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +28: [2023-04-29 11:26:40,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +41: [2023-04-29 11:26:40,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +41: [2023-04-29 11:26:40,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 11:26:40,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +41: [2023-04-29 11:26:40,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +55: [2023-04-29 11:26:40,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +55: [2023-04-29 11:26:40,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +37: [2023-04-29 11:26:40,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +55: [2023-04-29 11:26:40,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 11:26:40,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 11:26:40,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 11:26:40,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +55: [2023-04-29 11:26:40,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 11:26:40,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 11:26:40,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 11:26:40,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 11:26:40,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 11:26:40,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +44: [2023-04-29 11:26:40,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 11:26:40,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +62: [2023-04-29 11:26:40,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +40: [2023-04-29 11:26:40,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +14: [2023-04-29 11:26:40,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +41: [2023-04-29 11:26:40,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 11:26:40,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +40: [2023-04-29 11:26:40,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +28: [2023-04-29 11:26:40,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +44: [2023-04-29 11:26:40,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +44: [2023-04-29 11:26:40,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +55: [2023-04-29 11:26:40,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +62: [2023-04-29 11:26:40,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +44: [2023-04-29 11:26:40,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +14: [2023-04-29 11:26:40,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +40: [2023-04-29 11:26:40,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 11:26:40,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +62: [2023-04-29 11:26:40,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +62: [2023-04-29 11:26:40,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +44: [2023-04-29 11:26:40,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 11:26:40,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +44: [2023-04-29 11:26:40,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +44: [2023-04-29 11:26:40,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +40: [2023-04-29 11:26:40,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 11:26:40,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 11:26:40,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 11:26:40,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 11:26:40,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +14: [2023-04-29 11:26:40,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +10: [2023-04-29 11:26:40,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +37: [2023-04-29 11:26:40,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +34: [2023-04-29 11:26:40,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 11:26:40,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +14: [2023-04-29 11:26:40,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +37: [2023-04-29 11:26:40,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +37: [2023-04-29 11:26:40,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 11:26:40,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +37: [2023-04-29 11:26:40,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +50: [2023-04-29 11:26:40,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +52: [2023-04-29 11:26:40,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +50: [2023-04-29 11:26:40,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +50: [2023-04-29 11:26:40,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +50: [2023-04-29 11:26:40,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +52: [2023-04-29 11:26:40,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +28: [2023-04-29 11:26:40,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +28: [2023-04-29 11:26:40,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +28: [2023-04-29 11:26:40,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_00-model_states.pt. +52: [2023-04-29 11:26:40,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +10: [2023-04-29 11:26:40,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +28: [2023-04-29 11:26:40,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +34: [2023-04-29 11:26:40,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +34: [2023-04-29 11:26:40,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +52: [2023-04-29 11:26:40,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +34: [2023-04-29 11:26:40,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +34: [2023-04-29 11:26:40,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +38: [2023-04-29 11:26:40,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 11:26:40,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 11:26:40,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 11:26:40,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 11:26:40,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 11:26:40,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 11:26:40,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 11:26:40,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 11:26:40,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +52: [2023-04-29 11:26:40,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +38: [2023-04-29 11:26:40,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +38: [2023-04-29 11:26:40,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +52: [2023-04-29 11:26:40,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +38: [2023-04-29 11:26:40,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +43: [2023-04-29 11:26:40,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 11:26:40,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +49: [2023-04-29 11:26:40,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +28: [2023-04-29 11:26:40,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +49: [2023-04-29 11:26:40,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +49: [2023-04-29 11:26:40,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +28: [2023-04-29 11:26:40,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +49: [2023-04-29 11:26:40,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +49: [2023-04-29 11:26:40,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +33: [2023-04-29 11:26:40,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 11:26:40,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +52: [2023-04-29 11:26:40,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +34: [2023-04-29 11:26:40,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +59: [2023-04-29 11:26:40,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 11:26:40,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 11:26:40,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +34: [2023-04-29 11:26:40,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +34: [2023-04-29 11:26:40,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +49: [2023-04-29 11:26:40,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +57: [2023-04-29 11:26:40,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 11:26:40,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 11:26:40,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 11:26:40,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +43: [2023-04-29 11:26:40,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +35: [2023-04-29 11:26:40,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 11:26:40,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 11:26:40,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +42: [2023-04-29 11:26:40,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 11:26:40,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +52: [2023-04-29 11:26:40,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +43: [2023-04-29 11:26:40,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +43: [2023-04-29 11:26:40,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 11:26:40,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 11:26:40,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 11:26:40,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 11:26:40,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 11:26:40,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 11:26:40,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 11:26:40,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 11:26:40,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 11:26:40,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 11:26:40,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +36: [2023-04-29 11:26:40,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 11:26:40,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +55: [2023-04-29 11:26:40,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 11:26:40,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +38: [2023-04-29 11:26:40,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +56: [2023-04-29 11:26:40,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 11:26:40,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +42: [2023-04-29 11:26:40,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +48: [2023-04-29 11:26:40,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 11:26:40,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 11:26:40,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +42: [2023-04-29 11:26:40,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +38: [2023-04-29 11:26:40,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +40: [2023-04-29 11:26:40,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 11:26:40,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 11:26:40,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +63: [2023-04-29 11:26:40,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +55: [2023-04-29 11:26:40,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 11:26:40,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +35: [2023-04-29 11:26:40,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +35: [2023-04-29 11:26:40,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 11:26:40,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 11:26:40,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 11:26:40,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 11:26:40,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +42: [2023-04-29 11:26:40,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +38: [2023-04-29 11:26:40,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +38: [2023-04-29 11:26:40,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 11:26:40,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +36: [2023-04-29 11:26:40,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +36: [2023-04-29 11:26:40,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +33: [2023-04-29 11:26:40,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +44: [2023-04-29 11:26:40,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +43: [2023-04-29 11:26:40,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +35: [2023-04-29 11:26:40,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 11:26:40,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +41: [2023-04-29 11:26:40,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 11:26:40,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +48: [2023-04-29 11:26:40,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +40: [2023-04-29 11:26:40,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 11:26:40,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +55: [2023-04-29 11:26:40,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +55: [2023-04-29 11:26:40,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 11:26:40,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +57: [2023-04-29 11:26:40,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +47: [2023-04-29 11:26:40,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +47: [2023-04-29 11:26:40,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +47: [2023-04-29 11:26:40,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +47: [2023-04-29 11:26:40,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +35: [2023-04-29 11:26:40,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +47: [2023-04-29 11:26:40,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +47: [2023-04-29 11:26:40,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +47: [2023-04-29 11:26:40,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +47: [2023-04-29 11:26:40,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 11:26:40,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 11:26:40,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 11:26:40,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +43: [2023-04-29 11:26:40,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +33: [2023-04-29 11:26:40,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +59: [2023-04-29 11:26:40,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +43: [2023-04-29 11:26:40,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +58: [2023-04-29 11:26:40,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +58: [2023-04-29 11:26:40,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +58: [2023-04-29 11:26:40,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +58: [2023-04-29 11:26:40,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +58: [2023-04-29 11:26:40,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +58: [2023-04-29 11:26:40,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +58: [2023-04-29 11:26:40,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +44: [2023-04-29 11:26:40,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 11:26:40,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +58: [2023-04-29 11:26:40,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +59: [2023-04-29 11:26:40,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +57: [2023-04-29 11:26:40,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +57: [2023-04-29 11:26:40,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +43: [2023-04-29 11:26:40,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +56: [2023-04-29 11:26:40,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +56: [2023-04-29 11:26:40,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +45: [2023-04-29 11:26:40,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +45: [2023-04-29 11:26:40,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +47: [2023-04-29 11:26:40,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +56: [2023-04-29 11:26:40,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +47: [2023-04-29 11:26:40,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +47: [2023-04-29 11:26:40,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +47: [2023-04-29 11:26:40,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +55: [2023-04-29 11:26:40,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +33: [2023-04-29 11:26:40,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +33: [2023-04-29 11:26:40,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 11:26:40,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +40: [2023-04-29 11:26:40,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +40: [2023-04-29 11:26:40,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +56: [2023-04-29 11:26:40,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 11:26:40,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +45: [2023-04-29 11:26:40,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +45: [2023-04-29 11:26:40,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +45: [2023-04-29 11:26:40,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +45: [2023-04-29 11:26:40,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +45: [2023-04-29 11:26:40,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +45: [2023-04-29 11:26:40,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +58: [2023-04-29 11:26:40,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +37: [2023-04-29 11:26:40,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +37: [2023-04-29 11:26:40,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +47: [2023-04-29 11:26:40,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +47: [2023-04-29 11:26:40,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +58: [2023-04-29 11:26:40,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 11:26:40,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +48: [2023-04-29 11:26:40,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +58: [2023-04-29 11:26:40,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +58: [2023-04-29 11:26:40,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +58: [2023-04-29 11:26:40,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +58: [2023-04-29 11:26:40,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +58: [2023-04-29 11:26:40,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +47: [2023-04-29 11:26:40,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +58: [2023-04-29 11:26:40,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +63: [2023-04-29 11:26:40,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +45: [2023-04-29 11:26:40,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +45: [2023-04-29 11:26:40,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +55: [2023-04-29 11:26:40,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +63: [2023-04-29 11:26:40,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +40: [2023-04-29 11:26:40,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +41: [2023-04-29 11:26:40,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +45: [2023-04-29 11:26:40,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +45: [2023-04-29 11:26:40,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +44: [2023-04-29 11:26:40,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +35: [2023-04-29 11:26:40,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +35: [2023-04-29 11:26:40,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +41: [2023-04-29 11:26:40,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 11:26:40,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +59: [2023-04-29 11:26:40,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +35: [2023-04-29 11:26:40,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +63: [2023-04-29 11:26:40,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 11:26:40,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +63: [2023-04-29 11:26:40,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 11:26:40,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +45: [2023-04-29 11:26:40,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +45: [2023-04-29 11:26:40,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +41: [2023-04-29 11:26:40,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 11:26:40,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 11:26:40,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +41: [2023-04-29 11:26:40,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +45: [2023-04-29 11:26:40,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt... +55: [2023-04-29 11:26:40,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +55: [2023-04-29 11:26:40,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +45: [2023-04-29 11:26:40,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt... +40: [2023-04-29 11:26:40,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 11:26:40,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 11:26:40,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +44: [2023-04-29 11:26:40,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +44: [2023-04-29 11:26:40,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +44: [2023-04-29 11:26:40,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 11:26:40,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 11:26:40,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +40: [2023-04-29 11:26:40,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +49: [2023-04-29 11:26:40,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +40: [2023-04-29 11:26:40,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +49: [2023-04-29 11:26:40,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 11:26:40,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 11:26:40,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 11:26:40,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 11:26:40,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +42: [2023-04-29 11:26:40,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 11:26:40,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 11:26:40,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +47: [2023-04-29 11:26:40,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +45: [2023-04-29 11:26:40,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 11:26:40,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +42: [2023-04-29 11:26:40,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +49: [2023-04-29 11:26:40,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +58: [2023-04-29 11:26:40,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +58: [2023-04-29 11:26:40,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +47: [2023-04-29 11:26:40,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +58: [2023-04-29 11:26:40,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +58: [2023-04-29 11:26:40,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +49: [2023-04-29 11:26:40,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +47: [2023-04-29 11:26:40,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +47: [2023-04-29 11:26:40,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +45: [2023-04-29 11:26:40,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +47: [2023-04-29 11:26:40,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +42: [2023-04-29 11:26:40,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +45: [2023-04-29 11:26:40,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +42: [2023-04-29 11:26:40,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +42: [2023-04-29 11:26:40,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +45: [2023-04-29 11:26:40,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_00-model_states.pt. +45: [2023-04-29 11:26:40,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +58: [2023-04-29 11:26:40,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +58: [2023-04-29 11:26:40,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +58: [2023-04-29 11:26:40,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +47: [2023-04-29 11:26:40,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +58: [2023-04-29 11:26:40,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +45: [2023-04-29 11:26:40,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +47: [2023-04-29 11:26:40,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +47: [2023-04-29 11:26:40,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +45: [2023-04-29 11:26:40,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +45: [2023-04-29 11:26:40,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +61: [2023-04-29 11:26:40,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 11:26:40,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 11:26:40,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 11:26:40,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 11:26:40,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +61: [2023-04-29 11:26:40,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +61: [2023-04-29 11:26:40,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +61: [2023-04-29 11:26:40,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +61: [2023-04-29 11:26:40,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +61: [2023-04-29 11:26:40,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +61: [2023-04-29 11:26:40,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +61: [2023-04-29 11:26:40,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +32: [2023-04-29 11:26:40,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +32: [2023-04-29 11:26:40,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +32: [2023-04-29 11:26:40,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +32: [2023-04-29 11:26:40,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +51: [2023-04-29 11:26:40,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +51: [2023-04-29 11:26:40,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +51: [2023-04-29 11:26:40,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +51: [2023-04-29 11:26:40,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +32: [2023-04-29 11:26:40,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +32: [2023-04-29 11:26:40,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +32: [2023-04-29 11:26:40,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +32: [2023-04-29 11:26:40,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +61: [2023-04-29 11:26:40,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +61: [2023-04-29 11:26:40,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +61: [2023-04-29 11:26:40,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +61: [2023-04-29 11:26:40,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +61: [2023-04-29 11:26:40,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 11:26:40,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 11:26:40,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 11:26:40,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +51: [2023-04-29 11:26:40,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +51: [2023-04-29 11:26:40,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +51: [2023-04-29 11:26:40,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +51: [2023-04-29 11:26:40,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 4: [2023-04-29 11:26:40,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 4: [2023-04-29 11:26:40,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 4: [2023-04-29 11:26:40,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 4: [2023-04-29 11:26:40,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 4: [2023-04-29 11:26:40,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 4: [2023-04-29 11:26:40,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 4: [2023-04-29 11:26:40,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 4: [2023-04-29 11:26:40,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +39: [2023-04-29 11:26:40,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +39: [2023-04-29 11:26:40,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +39: [2023-04-29 11:26:40,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 11:26:40,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +61: [2023-04-29 11:26:40,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +39: [2023-04-29 11:26:40,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 11:26:40,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +61: [2023-04-29 11:26:40,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +39: [2023-04-29 11:26:40,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +39: [2023-04-29 11:26:40,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +39: [2023-04-29 11:26:40,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 9: [2023-04-29 11:26:40,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 9: [2023-04-29 11:26:40,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +39: [2023-04-29 11:26:40,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 9: [2023-04-29 11:26:40,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 9: [2023-04-29 11:26:40,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 9: [2023-04-29 11:26:40,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 9: [2023-04-29 11:26:40,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 9: [2023-04-29 11:26:40,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 9: [2023-04-29 11:26:40,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +53: [2023-04-29 11:26:40,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +53: [2023-04-29 11:26:40,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +53: [2023-04-29 11:26:40,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +53: [2023-04-29 11:26:40,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +61: [2023-04-29 11:26:40,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +32: [2023-04-29 11:26:40,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +32: [2023-04-29 11:26:40,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +32: [2023-04-29 11:26:40,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +32: [2023-04-29 11:26:40,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 11:26:40,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... + 9: [2023-04-29 11:26:40,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 9: [2023-04-29 11:26:40,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 9: [2023-04-29 11:26:40,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +32: [2023-04-29 11:26:40,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +15: [2023-04-29 11:26:40,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +32: [2023-04-29 11:26:40,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +15: [2023-04-29 11:26:40,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +15: [2023-04-29 11:26:40,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 9: [2023-04-29 11:26:40,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +15: [2023-04-29 11:26:40,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +32: [2023-04-29 11:26:40,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +32: [2023-04-29 11:26:40,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +26: [2023-04-29 11:26:40,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +26: [2023-04-29 11:26:40,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +26: [2023-04-29 11:26:40,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +26: [2023-04-29 11:26:40,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +53: [2023-04-29 11:26:40,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +53: [2023-04-29 11:26:40,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +53: [2023-04-29 11:26:40,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +53: [2023-04-29 11:26:40,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +61: [2023-04-29 11:26:40,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 11:26:40,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 11:26:40,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +61: [2023-04-29 11:26:40,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... + 4: [2023-04-29 11:26:40,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +61: [2023-04-29 11:26:40,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +61: [2023-04-29 11:26:40,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... + 4: [2023-04-29 11:26:40,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +19: [2023-04-29 11:26:40,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +19: [2023-04-29 11:26:40,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +19: [2023-04-29 11:26:40,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +19: [2023-04-29 11:26:40,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +21: [2023-04-29 11:26:40,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +21: [2023-04-29 11:26:40,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 4: [2023-04-29 11:26:40,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +21: [2023-04-29 11:26:40,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +21: [2023-04-29 11:26:40,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 4: [2023-04-29 11:26:40,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +15: [2023-04-29 11:26:40,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +15: [2023-04-29 11:26:40,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +15: [2023-04-29 11:26:40,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +34: [2023-04-29 11:26:40,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +34: [2023-04-29 11:26:40,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +15: [2023-04-29 11:26:40,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +57: [2023-04-29 11:26:40,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +57: [2023-04-29 11:26:40,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +57: [2023-04-29 11:26:40,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +57: [2023-04-29 11:26:40,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +26: [2023-04-29 11:26:40,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +34: [2023-04-29 11:26:40,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +34: [2023-04-29 11:26:40,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +51: [2023-04-29 11:26:40,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +51: [2023-04-29 11:26:40,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +51: [2023-04-29 11:26:40,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +51: [2023-04-29 11:26:40,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +51: [2023-04-29 11:26:40,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +51: [2023-04-29 11:26:40,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +51: [2023-04-29 11:26:40,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +51: [2023-04-29 11:26:40,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +26: [2023-04-29 11:26:40,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +39: [2023-04-29 11:26:40,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +39: [2023-04-29 11:26:40,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +26: [2023-04-29 11:26:40,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +26: [2023-04-29 11:26:40,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 9: [2023-04-29 11:26:40,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +51: [2023-04-29 11:26:40,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +51: [2023-04-29 11:26:40,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +51: [2023-04-29 11:26:40,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +51: [2023-04-29 11:26:40,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +51: [2023-04-29 11:26:40,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +51: [2023-04-29 11:26:40,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +51: [2023-04-29 11:26:40,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +51: [2023-04-29 11:26:40,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 9: [2023-04-29 11:26:40,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 9: [2023-04-29 11:26:40,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +39: [2023-04-29 11:26:40,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +39: [2023-04-29 11:26:40,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +32: [2023-04-29 11:26:40,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 9: [2023-04-29 11:26:40,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +32: [2023-04-29 11:26:40,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +32: [2023-04-29 11:26:40,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 4: [2023-04-29 11:26:40,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +32: [2023-04-29 11:26:40,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +32: [2023-04-29 11:26:40,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +32: [2023-04-29 11:26:40,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +21: [2023-04-29 11:26:40,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +32: [2023-04-29 11:26:40,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +19: [2023-04-29 11:26:40,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +32: [2023-04-29 11:26:40,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +19: [2023-04-29 11:26:40,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +19: [2023-04-29 11:26:40,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +19: [2023-04-29 11:26:40,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +21: [2023-04-29 11:26:40,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 4: [2023-04-29 11:26:40,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +34: [2023-04-29 11:26:40,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +34: [2023-04-29 11:26:40,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +23: [2023-04-29 11:26:40,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +23: [2023-04-29 11:26:40,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +23: [2023-04-29 11:26:40,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +23: [2023-04-29 11:26:40,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +21: [2023-04-29 11:26:40,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +21: [2023-04-29 11:26:40,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 8: [2023-04-29 11:26:40,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +34: [2023-04-29 11:26:40,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +34: [2023-04-29 11:26:40,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 9: [2023-04-29 11:26:40,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 8: [2023-04-29 11:26:40,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 8: [2023-04-29 11:26:40,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 8: [2023-04-29 11:26:40,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +57: [2023-04-29 11:26:40,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +57: [2023-04-29 11:26:40,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 4: [2023-04-29 11:26:40,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +60: [2023-04-29 11:26:40,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +60: [2023-04-29 11:26:40,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +57: [2023-04-29 11:26:40,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +57: [2023-04-29 11:26:40,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 4: [2023-04-29 11:26:40,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +60: [2023-04-29 11:26:40,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +60: [2023-04-29 11:26:40,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. + 8: [2023-04-29 11:26:40,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +39: [2023-04-29 11:26:40,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +39: [2023-04-29 11:26:40,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 8: [2023-04-29 11:26:40,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 8: [2023-04-29 11:26:40,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 8: [2023-04-29 11:26:40,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +19: [2023-04-29 11:26:40,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +19: [2023-04-29 11:26:40,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 9: [2023-04-29 11:26:40,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 9: [2023-04-29 11:26:40,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +39: [2023-04-29 11:26:40,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +19: [2023-04-29 11:26:40,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +19: [2023-04-29 11:26:40,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +48: [2023-04-29 11:26:40,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +48: [2023-04-29 11:26:40,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +48: [2023-04-29 11:26:40,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +48: [2023-04-29 11:26:40,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +39: [2023-04-29 11:26:40,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 9: [2023-04-29 11:26:40,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +19: [2023-04-29 11:26:40,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +19: [2023-04-29 11:26:40,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +19: [2023-04-29 11:26:40,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +19: [2023-04-29 11:26:40,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +59: [2023-04-29 11:26:40,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +59: [2023-04-29 11:26:40,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +59: [2023-04-29 11:26:40,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +59: [2023-04-29 11:26:40,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +23: [2023-04-29 11:26:40,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +23: [2023-04-29 11:26:40,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +23: [2023-04-29 11:26:40,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +23: [2023-04-29 11:26:40,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +60: [2023-04-29 11:26:40,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 9: [2023-04-29 11:26:40,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +60: [2023-04-29 11:26:40,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +60: [2023-04-29 11:26:40,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +60: [2023-04-29 11:26:40,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +16: [2023-04-29 11:26:40,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +16: [2023-04-29 11:26:40,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +16: [2023-04-29 11:26:40,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +16: [2023-04-29 11:26:40,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +48: [2023-04-29 11:26:40,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 11:26:40,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 11:26:40,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 11:26:40,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +30: [2023-04-29 11:26:40,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +30: [2023-04-29 11:26:40,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +30: [2023-04-29 11:26:40,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +30: [2023-04-29 11:26:40,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +50: [2023-04-29 11:26:40,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +50: [2023-04-29 11:26:40,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +16: [2023-04-29 11:26:40,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +16: [2023-04-29 11:26:40,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +50: [2023-04-29 11:26:40,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +50: [2023-04-29 11:26:40,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +16: [2023-04-29 11:26:40,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +16: [2023-04-29 11:26:40,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +62: [2023-04-29 11:26:40,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +62: [2023-04-29 11:26:40,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +62: [2023-04-29 11:26:40,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +62: [2023-04-29 11:26:40,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 11:26:40,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +54: [2023-04-29 11:26:40,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. + 9: [2023-04-29 11:26:40,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 9: [2023-04-29 11:26:40,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +52: [2023-04-29 11:26:40,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +52: [2023-04-29 11:26:40,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +54: [2023-04-29 11:26:40,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +54: [2023-04-29 11:26:40,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +59: [2023-04-29 11:26:40,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +59: [2023-04-29 11:26:40,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +59: [2023-04-29 11:26:40,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +51: [2023-04-29 11:26:40,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 9: [2023-04-29 11:26:40,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +52: [2023-04-29 11:26:40,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +62: [2023-04-29 11:26:40,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +62: [2023-04-29 11:26:40,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +62: [2023-04-29 11:26:40,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +52: [2023-04-29 11:26:40,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +38: [2023-04-29 11:26:40,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +38: [2023-04-29 11:26:40,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +38: [2023-04-29 11:26:40,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +38: [2023-04-29 11:26:40,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +39: [2023-04-29 11:26:40,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +39: [2023-04-29 11:26:40,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +39: [2023-04-29 11:26:40,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +62: [2023-04-29 11:26:40,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +59: [2023-04-29 11:26:40,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +39: [2023-04-29 11:26:40,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. + 5: [2023-04-29 11:26:40,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 5: [2023-04-29 11:26:40,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 5: [2023-04-29 11:26:40,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 5: [2023-04-29 11:26:40,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +37: [2023-04-29 11:26:40,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +37: [2023-04-29 11:26:40,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +37: [2023-04-29 11:26:40,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +34: [2023-04-29 11:26:40,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +34: [2023-04-29 11:26:40,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +34: [2023-04-29 11:26:40,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +34: [2023-04-29 11:26:40,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +37: [2023-04-29 11:26:40,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +53: [2023-04-29 11:26:40,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +53: [2023-04-29 11:26:40,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +53: [2023-04-29 11:26:40,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +53: [2023-04-29 11:26:40,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +53: [2023-04-29 11:26:40,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +53: [2023-04-29 11:26:40,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +53: [2023-04-29 11:26:40,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +51: [2023-04-29 11:26:40,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +51: [2023-04-29 11:26:40,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +53: [2023-04-29 11:26:40,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 11:26:40,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 11:26:40,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 11:26:40,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +51: [2023-04-29 11:26:40,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 11:26:40,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 5: [2023-04-29 11:26:40,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 5: [2023-04-29 11:26:40,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 5: [2023-04-29 11:26:40,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +34: [2023-04-29 11:26:40,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 5: [2023-04-29 11:26:40,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +30: [2023-04-29 11:26:40,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +53: [2023-04-29 11:26:40,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +53: [2023-04-29 11:26:40,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +53: [2023-04-29 11:26:40,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +53: [2023-04-29 11:26:40,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +53: [2023-04-29 11:26:40,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 9: [2023-04-29 11:26:40,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +53: [2023-04-29 11:26:40,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +53: [2023-04-29 11:26:40,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +34: [2023-04-29 11:26:40,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +54: [2023-04-29 11:26:40,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +34: [2023-04-29 11:26:40,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +53: [2023-04-29 11:26:40,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +30: [2023-04-29 11:26:40,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +32: [2023-04-29 11:26:40,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +50: [2023-04-29 11:26:40,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +50: [2023-04-29 11:26:40,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +30: [2023-04-29 11:26:40,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +30: [2023-04-29 11:26:40,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +54: [2023-04-29 11:26:40,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +54: [2023-04-29 11:26:40,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +54: [2023-04-29 11:26:40,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +50: [2023-04-29 11:26:40,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +50: [2023-04-29 11:26:40,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +34: [2023-04-29 11:26:40,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 6: [2023-04-29 11:26:40,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 6: [2023-04-29 11:26:40,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 6: [2023-04-29 11:26:40,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 6: [2023-04-29 11:26:40,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +19: [2023-04-29 11:26:40,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +52: [2023-04-29 11:26:41,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +52: [2023-04-29 11:26:41,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +32: [2023-04-29 11:26:41,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 11:26:41,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +32: [2023-04-29 11:26:41,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +32: [2023-04-29 11:26:41,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 11:26:41,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +52: [2023-04-29 11:26:41,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +34: [2023-04-29 11:26:41,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +34: [2023-04-29 11:26:41,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 11:26:41,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +32: [2023-04-29 11:26:41,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +19: [2023-04-29 11:26:41,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +19: [2023-04-29 11:26:41,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +52: [2023-04-29 11:26:41,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +26: [2023-04-29 11:26:41,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +26: [2023-04-29 11:26:41,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +26: [2023-04-29 11:26:41,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +26: [2023-04-29 11:26:41,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +26: [2023-04-29 11:26:41,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +26: [2023-04-29 11:26:41,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +26: [2023-04-29 11:26:41,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +51: [2023-04-29 11:26:41,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +26: [2023-04-29 11:26:41,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +38: [2023-04-29 11:26:41,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +46: [2023-04-29 11:26:41,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +46: [2023-04-29 11:26:41,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +54: [2023-04-29 11:26:41,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +46: [2023-04-29 11:26:41,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +46: [2023-04-29 11:26:41,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. + 8: [2023-04-29 11:26:41,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +38: [2023-04-29 11:26:41,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +41: [2023-04-29 11:26:41,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +41: [2023-04-29 11:26:41,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +41: [2023-04-29 11:26:41,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +41: [2023-04-29 11:26:41,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. + 9: [2023-04-29 11:26:41,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 9: [2023-04-29 11:26:41,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +39: [2023-04-29 11:26:41,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +39: [2023-04-29 11:26:41,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +39: [2023-04-29 11:26:41,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +34: [2023-04-29 11:26:41,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +34: [2023-04-29 11:26:41,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +39: [2023-04-29 11:26:41,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +38: [2023-04-29 11:26:41,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +38: [2023-04-29 11:26:41,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +33: [2023-04-29 11:26:41,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +33: [2023-04-29 11:26:41,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +33: [2023-04-29 11:26:41,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +33: [2023-04-29 11:26:41,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +19: [2023-04-29 11:26:41,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... + 9: [2023-04-29 11:26:41,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +32: [2023-04-29 11:26:41,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +32: [2023-04-29 11:26:41,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... + 7: [2023-04-29 11:26:41,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 7: [2023-04-29 11:26:41,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 7: [2023-04-29 11:26:41,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 7: [2023-04-29 11:26:41,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +32: [2023-04-29 11:26:41,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +19: [2023-04-29 11:26:41,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +19: [2023-04-29 11:26:41,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +37: [2023-04-29 11:26:41,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +26: [2023-04-29 11:26:41,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +26: [2023-04-29 11:26:41,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +26: [2023-04-29 11:26:41,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +26: [2023-04-29 11:26:41,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +31: [2023-04-29 11:26:41,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +31: [2023-04-29 11:26:41,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +31: [2023-04-29 11:26:41,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +31: [2023-04-29 11:26:41,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +37: [2023-04-29 11:26:41,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +26: [2023-04-29 11:26:41,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +34: [2023-04-29 11:26:41,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +26: [2023-04-29 11:26:41,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +26: [2023-04-29 11:26:41,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 11:26:41,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +24: [2023-04-29 11:26:41,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +62: [2023-04-29 11:26:41,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +62: [2023-04-29 11:26:41,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +62: [2023-04-29 11:26:41,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +34: [2023-04-29 11:26:41,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +24: [2023-04-29 11:26:41,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 8: [2023-04-29 11:26:41,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 8: [2023-04-29 11:26:41,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +62: [2023-04-29 11:26:41,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. + 8: [2023-04-29 11:26:41,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +24: [2023-04-29 11:26:41,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +26: [2023-04-29 11:26:41,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +37: [2023-04-29 11:26:41,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 11:26:41,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +51: [2023-04-29 11:26:41,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +60: [2023-04-29 11:26:41,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +60: [2023-04-29 11:26:41,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +19: [2023-04-29 11:26:41,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +19: [2023-04-29 11:26:41,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +51: [2023-04-29 11:26:41,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +60: [2023-04-29 11:26:41,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +60: [2023-04-29 11:26:41,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +51: [2023-04-29 11:26:41,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +18: [2023-04-29 11:26:41,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +18: [2023-04-29 11:26:41,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +18: [2023-04-29 11:26:41,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +18: [2023-04-29 11:26:41,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +22: [2023-04-29 11:26:41,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +22: [2023-04-29 11:26:41,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +22: [2023-04-29 11:26:41,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +22: [2023-04-29 11:26:41,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +19: [2023-04-29 11:26:41,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +19: [2023-04-29 11:26:41,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +60: [2023-04-29 11:26:41,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 3: [2023-04-29 11:26:41,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +34: [2023-04-29 11:26:41,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +60: [2023-04-29 11:26:41,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +60: [2023-04-29 11:26:41,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +19: [2023-04-29 11:26:41,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +19: [2023-04-29 11:26:41,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 3: [2023-04-29 11:26:41,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 3: [2023-04-29 11:26:41,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +33: [2023-04-29 11:26:41,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +13: [2023-04-29 11:26:41,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +13: [2023-04-29 11:26:41,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +13: [2023-04-29 11:26:41,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +33: [2023-04-29 11:26:41,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +33: [2023-04-29 11:26:41,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +46: [2023-04-29 11:26:41,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +13: [2023-04-29 11:26:41,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +60: [2023-04-29 11:26:41,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +33: [2023-04-29 11:26:41,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +41: [2023-04-29 11:26:41,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +34: [2023-04-29 11:26:41,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +46: [2023-04-29 11:26:41,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +46: [2023-04-29 11:26:41,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +46: [2023-04-29 11:26:41,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +41: [2023-04-29 11:26:41,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +41: [2023-04-29 11:26:41,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +41: [2023-04-29 11:26:41,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +43: [2023-04-29 11:26:41,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +43: [2023-04-29 11:26:41,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 3: [2023-04-29 11:26:41,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +43: [2023-04-29 11:26:41,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 3: [2023-04-29 11:26:41,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +60: [2023-04-29 11:26:41,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +60: [2023-04-29 11:26:41,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +12: [2023-04-29 11:26:41,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +12: [2023-04-29 11:26:41,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +12: [2023-04-29 11:26:41,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +43: [2023-04-29 11:26:41,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +12: [2023-04-29 11:26:41,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +33: [2023-04-29 11:26:41,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +33: [2023-04-29 11:26:41,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +47: [2023-04-29 11:26:41,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +47: [2023-04-29 11:26:41,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. + 7: [2023-04-29 11:26:41,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +33: [2023-04-29 11:26:41,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +33: [2023-04-29 11:26:41,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +43: [2023-04-29 11:26:41,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +43: [2023-04-29 11:26:41,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +43: [2023-04-29 11:26:41,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +43: [2023-04-29 11:26:41,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +33: [2023-04-29 11:26:41,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +60: [2023-04-29 11:26:41,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +60: [2023-04-29 11:26:41,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +33: [2023-04-29 11:26:41,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +33: [2023-04-29 11:26:41,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +33: [2023-04-29 11:26:41,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +16: [2023-04-29 11:26:41,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 7: [2023-04-29 11:26:41,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +60: [2023-04-29 11:26:41,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +47: [2023-04-29 11:26:41,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +31: [2023-04-29 11:26:41,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +47: [2023-04-29 11:26:41,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +31: [2023-04-29 11:26:41,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 7: [2023-04-29 11:26:41,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 11:26:41,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 11:26:41,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +60: [2023-04-29 11:26:41,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +31: [2023-04-29 11:26:41,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +60: [2023-04-29 11:26:41,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +31: [2023-04-29 11:26:41,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 11:26:41,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 11:26:41,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +62: [2023-04-29 11:26:41,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +38: [2023-04-29 11:26:41,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +38: [2023-04-29 11:26:41,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +38: [2023-04-29 11:26:41,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +38: [2023-04-29 11:26:41,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +18: [2023-04-29 11:26:41,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +18: [2023-04-29 11:26:41,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +16: [2023-04-29 11:26:41,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +62: [2023-04-29 11:26:41,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +22: [2023-04-29 11:26:41,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +62: [2023-04-29 11:26:41,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +22: [2023-04-29 11:26:41,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +22: [2023-04-29 11:26:41,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +62: [2023-04-29 11:26:41,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +16: [2023-04-29 11:26:41,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +16: [2023-04-29 11:26:41,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +18: [2023-04-29 11:26:41,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +19: [2023-04-29 11:26:41,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +22: [2023-04-29 11:26:41,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +19: [2023-04-29 11:26:41,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +38: [2023-04-29 11:26:41,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +60: [2023-04-29 11:26:41,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +13: [2023-04-29 11:26:41,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 1: [2023-04-29 11:26:41,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 1: [2023-04-29 11:26:41,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +18: [2023-04-29 11:26:41,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +38: [2023-04-29 11:26:41,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +12: [2023-04-29 11:26:41,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +38: [2023-04-29 11:26:41,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +13: [2023-04-29 11:26:41,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +11: [2023-04-29 11:26:41,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +11: [2023-04-29 11:26:41,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +11: [2023-04-29 11:26:41,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +12: [2023-04-29 11:26:41,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +11: [2023-04-29 11:26:41,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +12: [2023-04-29 11:26:41,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +12: [2023-04-29 11:26:41,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +38: [2023-04-29 11:26:41,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +19: [2023-04-29 11:26:41,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +19: [2023-04-29 11:26:41,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +27: [2023-04-29 11:26:41,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +27: [2023-04-29 11:26:41,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +27: [2023-04-29 11:26:41,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +27: [2023-04-29 11:26:41,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +47: [2023-04-29 11:26:41,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +47: [2023-04-29 11:26:41,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +13: [2023-04-29 11:26:41,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +13: [2023-04-29 11:26:41,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +34: [2023-04-29 11:26:41,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 3: [2023-04-29 11:26:41,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 3: [2023-04-29 11:26:41,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 3: [2023-04-29 11:26:41,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 3: [2023-04-29 11:26:41,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +47: [2023-04-29 11:26:41,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +53: [2023-04-29 11:26:41,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +53: [2023-04-29 11:26:41,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 0: [2023-04-29 11:26:41,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 0: [2023-04-29 11:26:41,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +36: [2023-04-29 11:26:41,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +36: [2023-04-29 11:26:41,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +36: [2023-04-29 11:26:41,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +36: [2023-04-29 11:26:41,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +16: [2023-04-29 11:26:41,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +47: [2023-04-29 11:26:41,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 5: [2023-04-29 11:26:41,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +62: [2023-04-29 11:26:41,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +62: [2023-04-29 11:26:41,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 11:26:41,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 11:26:41,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 11:26:41,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 11:26:41,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 11:26:41,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 11:26:41,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 11:26:41,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 11:26:41,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +62: [2023-04-29 11:26:41,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 11:26:41,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +10: [2023-04-29 11:26:41,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +53: [2023-04-29 11:26:41,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +53: [2023-04-29 11:26:41,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +17: [2023-04-29 11:26:41,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +17: [2023-04-29 11:26:41,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +17: [2023-04-29 11:26:41,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +50: [2023-04-29 11:26:41,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +62: [2023-04-29 11:26:41,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +50: [2023-04-29 11:26:41,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +50: [2023-04-29 11:26:41,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +50: [2023-04-29 11:26:41,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +17: [2023-04-29 11:26:41,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +10: [2023-04-29 11:26:41,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +10: [2023-04-29 11:26:41,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +36: [2023-04-29 11:26:41,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +10: [2023-04-29 11:26:41,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +63: [2023-04-29 11:26:41,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +63: [2023-04-29 11:26:41,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +36: [2023-04-29 11:26:41,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 11:26:41,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +25: [2023-04-29 11:26:41,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +25: [2023-04-29 11:26:41,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +36: [2023-04-29 11:26:41,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +25: [2023-04-29 11:26:41,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +25: [2023-04-29 11:26:41,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 5: [2023-04-29 11:26:41,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +63: [2023-04-29 11:26:41,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 11:26:41,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +63: [2023-04-29 11:26:41,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +50: [2023-04-29 11:26:41,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +50: [2023-04-29 11:26:41,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +29: [2023-04-29 11:26:41,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +29: [2023-04-29 11:26:41,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +29: [2023-04-29 11:26:41,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +29: [2023-04-29 11:26:41,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +54: [2023-04-29 11:26:41,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +50: [2023-04-29 11:26:41,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +50: [2023-04-29 11:26:41,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 11:26:41,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +59: [2023-04-29 11:26:41,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... + 8: [2023-04-29 11:26:41,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +63: [2023-04-29 11:26:41,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +63: [2023-04-29 11:26:41,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +50: [2023-04-29 11:26:41,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +34: [2023-04-29 11:26:41,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +34: [2023-04-29 11:26:41,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +63: [2023-04-29 11:26:41,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +63: [2023-04-29 11:26:41,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +50: [2023-04-29 11:26:41,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +50: [2023-04-29 11:26:41,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +11: [2023-04-29 11:26:41,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +50: [2023-04-29 11:26:41,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +50: [2023-04-29 11:26:41,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... + 1: [2023-04-29 11:26:41,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +50: [2023-04-29 11:26:41,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +54: [2023-04-29 11:26:41,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 11:26:41,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +50: [2023-04-29 11:26:41,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +50: [2023-04-29 11:26:41,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... + 1: [2023-04-29 11:26:41,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +16: [2023-04-29 11:26:41,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +34: [2023-04-29 11:26:41,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 11:26:41,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 11:26:41,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +34: [2023-04-29 11:26:41,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +59: [2023-04-29 11:26:41,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +11: [2023-04-29 11:26:41,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +59: [2023-04-29 11:26:41,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +54: [2023-04-29 11:26:41,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 11:26:41,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +11: [2023-04-29 11:26:41,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +11: [2023-04-29 11:26:41,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +16: [2023-04-29 11:26:41,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +59: [2023-04-29 11:26:41,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +54: [2023-04-29 11:26:41,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 11:26:41,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +26: [2023-04-29 11:26:41,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +26: [2023-04-29 11:26:41,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +26: [2023-04-29 11:26:41,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +26: [2023-04-29 11:26:41,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +16: [2023-04-29 11:26:41,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +16: [2023-04-29 11:26:41,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +16: [2023-04-29 11:26:41,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +38: [2023-04-29 11:26:41,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +38: [2023-04-29 11:26:41,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 2: [2023-04-29 11:26:41,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 2: [2023-04-29 11:26:41,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 2: [2023-04-29 11:26:41,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 2: [2023-04-29 11:26:41,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +16: [2023-04-29 11:26:41,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +54: [2023-04-29 11:26:41,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +27: [2023-04-29 11:26:41,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +45: [2023-04-29 11:26:41,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +27: [2023-04-29 11:26:41,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +45: [2023-04-29 11:26:41,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +45: [2023-04-29 11:26:41,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +16: [2023-04-29 11:26:41,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +54: [2023-04-29 11:26:41,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +45: [2023-04-29 11:26:41,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +44: [2023-04-29 11:26:41,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +44: [2023-04-29 11:26:41,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +44: [2023-04-29 11:26:41,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +44: [2023-04-29 11:26:41,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. + 5: [2023-04-29 11:26:41,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 5: [2023-04-29 11:26:41,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +38: [2023-04-29 11:26:41,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +38: [2023-04-29 11:26:41,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +60: [2023-04-29 11:26:41,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +17: [2023-04-29 11:26:41,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +17: [2023-04-29 11:26:41,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +17: [2023-04-29 11:26:41,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +25: [2023-04-29 11:26:41,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +25: [2023-04-29 11:26:41,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +35: [2023-04-29 11:26:41,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +35: [2023-04-29 11:26:41,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +10: [2023-04-29 11:26:41,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +53: [2023-04-29 11:26:41,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +35: [2023-04-29 11:26:41,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +54: [2023-04-29 11:26:41,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +35: [2023-04-29 11:26:41,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +30: [2023-04-29 11:26:41,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +30: [2023-04-29 11:26:41,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +30: [2023-04-29 11:26:41,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +38: [2023-04-29 11:26:41,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +38: [2023-04-29 11:26:41,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +30: [2023-04-29 11:26:41,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +30: [2023-04-29 11:26:41,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +30: [2023-04-29 11:26:41,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +54: [2023-04-29 11:26:41,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +30: [2023-04-29 11:26:41,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +39: [2023-04-29 11:26:41,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +25: [2023-04-29 11:26:41,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +14: [2023-04-29 11:26:41,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +14: [2023-04-29 11:26:41,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +39: [2023-04-29 11:26:41,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +14: [2023-04-29 11:26:41,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +25: [2023-04-29 11:26:41,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +54: [2023-04-29 11:26:41,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +62: [2023-04-29 11:26:41,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +62: [2023-04-29 11:26:41,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +14: [2023-04-29 11:26:41,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +30: [2023-04-29 11:26:41,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +39: [2023-04-29 11:26:41,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +17: [2023-04-29 11:26:41,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +62: [2023-04-29 11:26:41,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +27: [2023-04-29 11:26:41,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +27: [2023-04-29 11:26:41,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +53: [2023-04-29 11:26:41,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +62: [2023-04-29 11:26:41,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +53: [2023-04-29 11:26:41,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +53: [2023-04-29 11:26:41,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +10: [2023-04-29 11:26:41,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +10: [2023-04-29 11:26:41,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +10: [2023-04-29 11:26:41,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +38: [2023-04-29 11:26:41,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +38: [2023-04-29 11:26:41,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +39: [2023-04-29 11:26:41,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +43: [2023-04-29 11:26:41,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +30: [2023-04-29 11:26:41,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +30: [2023-04-29 11:26:41,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +30: [2023-04-29 11:26:41,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +33: [2023-04-29 11:26:41,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +30: [2023-04-29 11:26:41,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +30: [2023-04-29 11:26:41,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +30: [2023-04-29 11:26:41,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +36: [2023-04-29 11:26:41,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +36: [2023-04-29 11:26:41,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +30: [2023-04-29 11:26:41,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +30: [2023-04-29 11:26:41,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +35: [2023-04-29 11:26:41,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +35: [2023-04-29 11:26:41,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +63: [2023-04-29 11:26:41,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +63: [2023-04-29 11:26:41,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +28: [2023-04-29 11:26:41,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +28: [2023-04-29 11:26:41,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +29: [2023-04-29 11:26:41,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +28: [2023-04-29 11:26:41,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +35: [2023-04-29 11:26:41,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +54: [2023-04-29 11:26:41,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +28: [2023-04-29 11:26:41,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +43: [2023-04-29 11:26:41,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +60: [2023-04-29 11:26:41,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +60: [2023-04-29 11:26:41,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +27: [2023-04-29 11:26:41,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +27: [2023-04-29 11:26:41,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +27: [2023-04-29 11:26:41,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +27: [2023-04-29 11:26:41,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +35: [2023-04-29 11:26:41,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +43: [2023-04-29 11:26:41,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +43: [2023-04-29 11:26:41,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +63: [2023-04-29 11:26:41,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +47: [2023-04-29 11:26:41,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +47: [2023-04-29 11:26:41,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +60: [2023-04-29 11:26:41,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +47: [2023-04-29 11:26:41,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +47: [2023-04-29 11:26:41,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 3: [2023-04-29 11:26:41,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +54: [2023-04-29 11:26:41,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +40: [2023-04-29 11:26:41,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +40: [2023-04-29 11:26:41,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +25: [2023-04-29 11:26:41,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +25: [2023-04-29 11:26:41,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +25: [2023-04-29 11:26:41,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +25: [2023-04-29 11:26:41,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +36: [2023-04-29 11:26:41,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +29: [2023-04-29 11:26:41,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +54: [2023-04-29 11:26:41,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +39: [2023-04-29 11:26:41,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +39: [2023-04-29 11:26:41,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +36: [2023-04-29 11:26:41,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +40: [2023-04-29 11:26:41,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +39: [2023-04-29 11:26:41,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... + 5: [2023-04-29 11:26:41,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 5: [2023-04-29 11:26:41,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 7: [2023-04-29 11:26:41,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 7: [2023-04-29 11:26:41,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +63: [2023-04-29 11:26:41,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. + 7: [2023-04-29 11:26:41,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +40: [2023-04-29 11:26:41,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +29: [2023-04-29 11:26:41,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +34: [2023-04-29 11:26:41,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +35: [2023-04-29 11:26:41,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +34: [2023-04-29 11:26:41,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +35: [2023-04-29 11:26:41,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +29: [2023-04-29 11:26:41,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +35: [2023-04-29 11:26:41,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 5: [2023-04-29 11:26:41,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +45: [2023-04-29 11:26:41,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +44: [2023-04-29 11:26:41,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +47: [2023-04-29 11:26:41,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +47: [2023-04-29 11:26:41,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +39: [2023-04-29 11:26:41,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +40: [2023-04-29 11:26:41,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +16: [2023-04-29 11:26:41,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +47: [2023-04-29 11:26:41,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +25: [2023-04-29 11:26:41,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +25: [2023-04-29 11:26:41,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +16: [2023-04-29 11:26:41,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +25: [2023-04-29 11:26:41,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +33: [2023-04-29 11:26:41,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +40: [2023-04-29 11:26:41,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +43: [2023-04-29 11:26:41,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +43: [2023-04-29 11:26:41,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +25: [2023-04-29 11:26:41,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +35: [2023-04-29 11:26:41,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +16: [2023-04-29 11:26:41,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +27: [2023-04-29 11:26:41,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +43: [2023-04-29 11:26:41,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. + 7: [2023-04-29 11:26:41,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +43: [2023-04-29 11:26:41,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +27: [2023-04-29 11:26:41,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +44: [2023-04-29 11:26:41,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +20: [2023-04-29 11:26:41,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +20: [2023-04-29 11:26:41,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +20: [2023-04-29 11:26:41,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +44: [2023-04-29 11:26:41,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +33: [2023-04-29 11:26:41,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +33: [2023-04-29 11:26:41,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +16: [2023-04-29 11:26:41,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +20: [2023-04-29 11:26:41,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +44: [2023-04-29 11:26:41,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +27: [2023-04-29 11:26:41,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +47: [2023-04-29 11:26:41,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 7: [2023-04-29 11:26:41,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +27: [2023-04-29 11:26:41,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +40: [2023-04-29 11:26:41,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +56: [2023-04-29 11:26:41,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +56: [2023-04-29 11:26:41,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +55: [2023-04-29 11:26:41,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +55: [2023-04-29 11:26:41,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +45: [2023-04-29 11:26:41,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +45: [2023-04-29 11:26:41,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +26: [2023-04-29 11:26:41,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +34: [2023-04-29 11:26:41,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +45: [2023-04-29 11:26:41,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +60: [2023-04-29 11:26:41,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +55: [2023-04-29 11:26:41,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +33: [2023-04-29 11:26:41,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +33: [2023-04-29 11:26:41,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +40: [2023-04-29 11:26:41,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +42: [2023-04-29 11:26:41,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +42: [2023-04-29 11:26:41,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +56: [2023-04-29 11:26:41,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +33: [2023-04-29 11:26:41,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +33: [2023-04-29 11:26:41,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +55: [2023-04-29 11:26:41,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +56: [2023-04-29 11:26:41,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +35: [2023-04-29 11:26:41,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +26: [2023-04-29 11:26:41,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +42: [2023-04-29 11:26:41,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +35: [2023-04-29 11:26:41,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 7: [2023-04-29 11:26:41,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... + 7: [2023-04-29 11:26:41,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 7: [2023-04-29 11:26:41,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +42: [2023-04-29 11:26:41,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +26: [2023-04-29 11:26:41,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 7: [2023-04-29 11:26:41,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 7: [2023-04-29 11:26:41,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +38: [2023-04-29 11:26:41,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +26: [2023-04-29 11:26:41,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 7: [2023-04-29 11:26:41,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +58: [2023-04-29 11:26:41,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +58: [2023-04-29 11:26:41,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. + 3: [2023-04-29 11:26:41,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +58: [2023-04-29 11:26:41,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. + 2: [2023-04-29 11:26:41,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +58: [2023-04-29 11:26:41,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +33: [2023-04-29 11:26:41,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +33: [2023-04-29 11:26:41,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +35: [2023-04-29 11:26:41,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +35: [2023-04-29 11:26:41,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 2: [2023-04-29 11:26:41,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 2: [2023-04-29 11:26:41,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 2: [2023-04-29 11:26:41,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +14: [2023-04-29 11:26:41,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +28: [2023-04-29 11:26:41,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +28: [2023-04-29 11:26:41,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +33: [2023-04-29 11:26:41,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +33: [2023-04-29 11:26:41,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +63: [2023-04-29 11:26:41,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +49: [2023-04-29 11:26:41,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +49: [2023-04-29 11:26:41,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. + 8: [2023-04-29 11:26:41,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +36: [2023-04-29 11:26:41,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +36: [2023-04-29 11:26:41,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +33: [2023-04-29 11:26:41,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +14: [2023-04-29 11:26:41,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +63: [2023-04-29 11:26:41,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +14: [2023-04-29 11:26:41,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +49: [2023-04-29 11:26:41,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +49: [2023-04-29 11:26:41,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +63: [2023-04-29 11:26:41,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +28: [2023-04-29 11:26:41,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +28: [2023-04-29 11:26:41,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 4: [2023-04-29 11:26:41,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. + 4: [2023-04-29 11:26:41,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +38: [2023-04-29 11:26:41,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +62: [2023-04-29 11:26:41,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +62: [2023-04-29 11:26:41,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_01-model_01-model_states.pt. +36: [2023-04-29 11:26:41,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +47: [2023-04-29 11:26:41,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +47: [2023-04-29 11:26:41,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +43: [2023-04-29 11:26:41,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +14: [2023-04-29 11:26:41,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +38: [2023-04-29 11:26:41,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +45: [2023-04-29 11:26:41,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +45: [2023-04-29 11:26:41,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +38: [2023-04-29 11:26:41,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +45: [2023-04-29 11:26:41,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +45: [2023-04-29 11:26:41,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +62: [2023-04-29 11:26:41,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +62: [2023-04-29 11:26:41,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +43: [2023-04-29 11:26:41,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +63: [2023-04-29 11:26:41,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 5: [2023-04-29 11:26:41,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +43: [2023-04-29 11:26:41,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +36: [2023-04-29 11:26:41,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +60: [2023-04-29 11:26:41,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +52: [2023-04-29 11:26:41,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +60: [2023-04-29 11:26:41,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +52: [2023-04-29 11:26:41,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +24: [2023-04-29 11:26:41,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +47: [2023-04-29 11:26:41,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +47: [2023-04-29 11:26:41,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +52: [2023-04-29 11:26:41,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +52: [2023-04-29 11:26:41,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +52: [2023-04-29 11:26:41,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +52: [2023-04-29 11:26:41,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +52: [2023-04-29 11:26:41,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +24: [2023-04-29 11:26:41,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +24: [2023-04-29 11:26:41,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +52: [2023-04-29 11:26:41,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +43: [2023-04-29 11:26:41,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 5: [2023-04-29 11:26:41,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 11:26:41,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +24: [2023-04-29 11:26:41,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +24: [2023-04-29 11:26:41,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +24: [2023-04-29 11:26:41,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +62: [2023-04-29 11:26:41,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +62: [2023-04-29 11:26:41,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +20: [2023-04-29 11:26:41,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 11:26:41,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +20: [2023-04-29 11:26:41,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +45: [2023-04-29 11:26:41,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +45: [2023-04-29 11:26:41,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +47: [2023-04-29 11:26:41,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +60: [2023-04-29 11:26:41,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +56: [2023-04-29 11:26:41,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +62: [2023-04-29 11:26:41,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +62: [2023-04-29 11:26:41,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +45: [2023-04-29 11:26:41,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 11:26:41,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +37: [2023-04-29 11:26:41,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +56: [2023-04-29 11:26:41,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 5: [2023-04-29 11:26:41,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +43: [2023-04-29 11:26:41,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +45: [2023-04-29 11:26:41,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 11:26:41,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +37: [2023-04-29 11:26:41,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +37: [2023-04-29 11:26:41,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +43: [2023-04-29 11:26:41,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 11:26:41,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +37: [2023-04-29 11:26:41,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +20: [2023-04-29 11:26:41,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +20: [2023-04-29 11:26:41,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +37: [2023-04-29 11:26:41,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 11:26:41,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +43: [2023-04-29 11:26:41,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +43: [2023-04-29 11:26:41,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +24: [2023-04-29 11:26:41,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +42: [2023-04-29 11:26:41,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +24: [2023-04-29 11:26:41,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +52: [2023-04-29 11:26:41,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +52: [2023-04-29 11:26:41,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +52: [2023-04-29 11:26:41,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +42: [2023-04-29 11:26:41,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +52: [2023-04-29 11:26:41,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +56: [2023-04-29 11:26:41,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +52: [2023-04-29 11:26:41,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +52: [2023-04-29 11:26:41,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +52: [2023-04-29 11:26:41,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +33: [2023-04-29 11:26:41,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +52: [2023-04-29 11:26:41,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +42: [2023-04-29 11:26:41,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +36: [2023-04-29 11:26:41,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +42: [2023-04-29 11:26:41,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +47: [2023-04-29 11:26:41,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +58: [2023-04-29 11:26:41,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +58: [2023-04-29 11:26:41,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +58: [2023-04-29 11:26:41,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +58: [2023-04-29 11:26:41,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +56: [2023-04-29 11:26:41,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +24: [2023-04-29 11:26:41,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 11:26:41,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +24: [2023-04-29 11:26:41,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +24: [2023-04-29 11:26:41,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 11:26:41,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +57: [2023-04-29 11:26:41,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +57: [2023-04-29 11:26:41,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +38: [2023-04-29 11:26:41,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +44: [2023-04-29 11:26:41,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +44: [2023-04-29 11:26:41,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +57: [2023-04-29 11:26:41,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +57: [2023-04-29 11:26:41,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +44: [2023-04-29 11:26:41,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +57: [2023-04-29 11:26:41,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +44: [2023-04-29 11:26:41,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +57: [2023-04-29 11:26:41,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +57: [2023-04-29 11:26:41,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +47: [2023-04-29 11:26:41,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +57: [2023-04-29 11:26:41,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +33: [2023-04-29 11:26:41,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +37: [2023-04-29 11:26:41,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 11:26:41,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +37: [2023-04-29 11:26:41,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 2: [2023-04-29 11:26:41,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +55: [2023-04-29 11:26:41,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +33: [2023-04-29 11:26:41,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +63: [2023-04-29 11:26:41,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +55: [2023-04-29 11:26:41,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 11:26:41,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... + 8: [2023-04-29 11:26:41,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +37: [2023-04-29 11:26:41,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +55: [2023-04-29 11:26:41,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +55: [2023-04-29 11:26:41,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... + 3: [2023-04-29 11:26:41,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +57: [2023-04-29 11:26:41,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +57: [2023-04-29 11:26:41,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 11:26:41,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +44: [2023-04-29 11:26:41,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +44: [2023-04-29 11:26:41,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +37: [2023-04-29 11:26:41,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +49: [2023-04-29 11:26:41,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +21: [2023-04-29 11:26:41,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +21: [2023-04-29 11:26:41,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +21: [2023-04-29 11:26:41,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +50: [2023-04-29 11:26:41,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +50: [2023-04-29 11:26:41,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +50: [2023-04-29 11:26:41,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +21: [2023-04-29 11:26:41,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +21: [2023-04-29 11:26:41,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +21: [2023-04-29 11:26:41,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +49: [2023-04-29 11:26:41,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +21: [2023-04-29 11:26:41,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +21: [2023-04-29 11:26:41,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +44: [2023-04-29 11:26:41,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +57: [2023-04-29 11:26:41,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +17: [2023-04-29 11:26:41,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +17: [2023-04-29 11:26:41,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +57: [2023-04-29 11:26:41,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +57: [2023-04-29 11:26:41,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +57: [2023-04-29 11:26:41,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... + 4: [2023-04-29 11:26:41,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 2: [2023-04-29 11:26:41,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +17: [2023-04-29 11:26:41,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +55: [2023-04-29 11:26:41,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +55: [2023-04-29 11:26:41,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +17: [2023-04-29 11:26:41,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +36: [2023-04-29 11:26:41,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +36: [2023-04-29 11:26:41,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +36: [2023-04-29 11:26:41,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +37: [2023-04-29 11:26:41,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +44: [2023-04-29 11:26:41,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +57: [2023-04-29 11:26:41,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +47: [2023-04-29 11:26:41,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... + 2: [2023-04-29 11:26:41,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +57: [2023-04-29 11:26:41,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +49: [2023-04-29 11:26:41,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +55: [2023-04-29 11:26:41,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +55: [2023-04-29 11:26:41,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +49: [2023-04-29 11:26:41,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +50: [2023-04-29 11:26:41,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 2: [2023-04-29 11:26:41,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 4: [2023-04-29 11:26:41,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +21: [2023-04-29 11:26:41,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +21: [2023-04-29 11:26:41,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... + 0: [2023-04-29 11:26:41,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +21: [2023-04-29 11:26:41,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +21: [2023-04-29 11:26:41,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +38: [2023-04-29 11:26:41,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 11:26:41,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +21: [2023-04-29 11:26:41,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +40: [2023-04-29 11:26:41,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +40: [2023-04-29 11:26:41,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +40: [2023-04-29 11:26:41,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. +38: [2023-04-29 11:26:41,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +21: [2023-04-29 11:26:41,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +21: [2023-04-29 11:26:41,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +63: [2023-04-29 11:26:41,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +63: [2023-04-29 11:26:41,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +63: [2023-04-29 11:26:41,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +21: [2023-04-29 11:26:41,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +55: [2023-04-29 11:26:41,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +40: [2023-04-29 11:26:41,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_24-model_01-model_states.pt. + 0: [2023-04-29 11:26:41,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +59: [2023-04-29 11:26:41,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 11:26:41,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 11:26:41,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 11:26:41,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +30: [2023-04-29 11:26:41,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +17: [2023-04-29 11:26:41,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +17: [2023-04-29 11:26:41,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... + 6: [2023-04-29 11:26:41,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +22: [2023-04-29 11:26:41,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +22: [2023-04-29 11:26:41,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +22: [2023-04-29 11:26:41,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +15: [2023-04-29 11:26:41,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +15: [2023-04-29 11:26:41,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +15: [2023-04-29 11:26:41,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +15: [2023-04-29 11:26:41,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +15: [2023-04-29 11:26:41,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +15: [2023-04-29 11:26:41,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +15: [2023-04-29 11:26:41,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +22: [2023-04-29 11:26:41,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +22: [2023-04-29 11:26:41,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +22: [2023-04-29 11:26:41,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +15: [2023-04-29 11:26:41,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +22: [2023-04-29 11:26:41,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +17: [2023-04-29 11:26:41,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +22: [2023-04-29 11:26:41,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +27: [2023-04-29 11:26:41,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 3: [2023-04-29 11:26:41,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 3: [2023-04-29 11:26:41,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +27: [2023-04-29 11:26:41,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +17: [2023-04-29 11:26:41,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +25: [2023-04-29 11:26:41,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +25: [2023-04-29 11:26:41,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +18: [2023-04-29 11:26:41,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +18: [2023-04-29 11:26:41,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +55: [2023-04-29 11:26:41,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +42: [2023-04-29 11:26:41,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +42: [2023-04-29 11:26:41,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +18: [2023-04-29 11:26:41,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +18: [2023-04-29 11:26:41,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +18: [2023-04-29 11:26:41,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +36: [2023-04-29 11:26:41,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +18: [2023-04-29 11:26:41,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +10: [2023-04-29 11:26:41,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +18: [2023-04-29 11:26:41,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +10: [2023-04-29 11:26:41,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +18: [2023-04-29 11:26:41,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +31: [2023-04-29 11:26:41,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +31: [2023-04-29 11:26:41,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +31: [2023-04-29 11:26:41,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +31: [2023-04-29 11:26:41,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +31: [2023-04-29 11:26:41,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +31: [2023-04-29 11:26:41,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +31: [2023-04-29 11:26:41,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +31: [2023-04-29 11:26:41,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 11:26:41,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +25: [2023-04-29 11:26:41,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 11:26:41,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 11:26:41,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 11:26:41,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 11:26:41,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 11:26:41,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 11:26:41,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 11:26:41,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +55: [2023-04-29 11:26:41,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +17: [2023-04-29 11:26:41,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +17: [2023-04-29 11:26:41,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +55: [2023-04-29 11:26:41,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... + 3: [2023-04-29 11:26:41,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +20: [2023-04-29 11:26:41,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +20: [2023-04-29 11:26:41,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +41: [2023-04-29 11:26:41,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +41: [2023-04-29 11:26:41,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +22: [2023-04-29 11:26:41,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +22: [2023-04-29 11:26:41,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +22: [2023-04-29 11:26:41,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +42: [2023-04-29 11:26:41,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +42: [2023-04-29 11:26:41,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +20: [2023-04-29 11:26:41,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +20: [2023-04-29 11:26:41,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +27: [2023-04-29 11:26:41,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +27: [2023-04-29 11:26:41,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +10: [2023-04-29 11:26:41,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +10: [2023-04-29 11:26:41,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +10: [2023-04-29 11:26:41,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +63: [2023-04-29 11:26:41,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +25: [2023-04-29 11:26:41,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +25: [2023-04-29 11:26:41,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +18: [2023-04-29 11:26:41,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +15: [2023-04-29 11:26:41,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +25: [2023-04-29 11:26:41,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +46: [2023-04-29 11:26:41,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +46: [2023-04-29 11:26:41,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +15: [2023-04-29 11:26:41,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +15: [2023-04-29 11:26:41,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +30: [2023-04-29 11:26:41,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +30: [2023-04-29 11:26:41,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +30: [2023-04-29 11:26:41,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +46: [2023-04-29 11:26:41,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +46: [2023-04-29 11:26:41,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +46: [2023-04-29 11:26:41,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +46: [2023-04-29 11:26:41,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +31: [2023-04-29 11:26:41,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +46: [2023-04-29 11:26:41,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +31: [2023-04-29 11:26:41,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +23: [2023-04-29 11:26:41,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +23: [2023-04-29 11:26:41,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +46: [2023-04-29 11:26:41,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +27: [2023-04-29 11:26:41,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +27: [2023-04-29 11:26:41,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +31: [2023-04-29 11:26:41,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +10: [2023-04-29 11:26:41,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +10: [2023-04-29 11:26:41,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +31: [2023-04-29 11:26:41,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +10: [2023-04-29 11:26:41,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +31: [2023-04-29 11:26:41,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +47: [2023-04-29 11:26:41,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +18: [2023-04-29 11:26:41,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +18: [2023-04-29 11:26:41,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +18: [2023-04-29 11:26:41,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +15: [2023-04-29 11:26:41,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +31: [2023-04-29 11:26:41,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +18: [2023-04-29 11:26:41,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +25: [2023-04-29 11:26:41,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +15: [2023-04-29 11:26:41,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +10: [2023-04-29 11:26:41,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +41: [2023-04-29 11:26:41,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +41: [2023-04-29 11:26:41,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +41: [2023-04-29 11:26:41,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +41: [2023-04-29 11:26:41,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +41: [2023-04-29 11:26:41,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +31: [2023-04-29 11:26:41,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +31: [2023-04-29 11:26:41,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +41: [2023-04-29 11:26:41,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +15: [2023-04-29 11:26:41,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +18: [2023-04-29 11:26:41,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +18: [2023-04-29 11:26:41,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +15: [2023-04-29 11:26:41,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +42: [2023-04-29 11:26:41,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +10: [2023-04-29 11:26:41,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +23: [2023-04-29 11:26:41,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +18: [2023-04-29 11:26:41,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +15: [2023-04-29 11:26:41,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +13: [2023-04-29 11:26:41,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +13: [2023-04-29 11:26:41,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +42: [2023-04-29 11:26:41,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +13: [2023-04-29 11:26:41,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +23: [2023-04-29 11:26:41,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +23: [2023-04-29 11:26:41,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +23: [2023-04-29 11:26:41,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +23: [2023-04-29 11:26:41,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 11:26:41,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +20: [2023-04-29 11:26:41,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +20: [2023-04-29 11:26:41,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +13: [2023-04-29 11:26:41,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +13: [2023-04-29 11:26:41,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +22: [2023-04-29 11:26:41,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +22: [2023-04-29 11:26:41,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +13: [2023-04-29 11:26:41,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +23: [2023-04-29 11:26:41,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +22: [2023-04-29 11:26:41,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +13: [2023-04-29 11:26:41,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +42: [2023-04-29 11:26:41,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 3: [2023-04-29 11:26:41,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +20: [2023-04-29 11:26:41,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +17: [2023-04-29 11:26:41,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +10: [2023-04-29 11:26:41,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +22: [2023-04-29 11:26:41,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +20: [2023-04-29 11:26:41,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +22: [2023-04-29 11:26:41,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +41: [2023-04-29 11:26:41,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +41: [2023-04-29 11:26:41,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +46: [2023-04-29 11:26:41,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +46: [2023-04-29 11:26:41,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +25: [2023-04-29 11:26:41,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +46: [2023-04-29 11:26:41,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +46: [2023-04-29 11:26:41,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +46: [2023-04-29 11:26:41,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +41: [2023-04-29 11:26:41,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +25: [2023-04-29 11:26:41,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +23: [2023-04-29 11:26:41,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +23: [2023-04-29 11:26:41,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +46: [2023-04-29 11:26:41,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +41: [2023-04-29 11:26:41,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +46: [2023-04-29 11:26:41,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +42: [2023-04-29 11:26:41,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +17: [2023-04-29 11:26:41,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +17: [2023-04-29 11:26:41,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +46: [2023-04-29 11:26:41,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +41: [2023-04-29 11:26:41,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +27: [2023-04-29 11:26:41,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +27: [2023-04-29 11:26:41,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +23: [2023-04-29 11:26:41,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +23: [2023-04-29 11:26:41,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +23: [2023-04-29 11:26:41,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +40: [2023-04-29 11:26:41,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +41: [2023-04-29 11:26:41,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +10: [2023-04-29 11:26:41,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +41: [2023-04-29 11:26:41,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +17: [2023-04-29 11:26:41,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +36: [2023-04-29 11:26:41,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +41: [2023-04-29 11:26:41,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... + 3: [2023-04-29 11:26:41,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +23: [2023-04-29 11:26:41,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +23: [2023-04-29 11:26:41,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +16: [2023-04-29 11:26:41,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +16: [2023-04-29 11:26:41,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +50: [2023-04-29 11:26:41,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +10: [2023-04-29 11:26:41,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +10: [2023-04-29 11:26:41,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +45: [2023-04-29 11:26:41,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +47: [2023-04-29 11:26:41,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +47: [2023-04-29 11:26:41,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +27: [2023-04-29 11:26:41,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +23: [2023-04-29 11:26:41,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +10: [2023-04-29 11:26:41,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +56: [2023-04-29 11:26:41,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +56: [2023-04-29 11:26:41,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +10: [2023-04-29 11:26:41,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +25: [2023-04-29 11:26:41,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +40: [2023-04-29 11:26:41,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +35: [2023-04-29 11:26:41,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +35: [2023-04-29 11:26:41,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +44: [2023-04-29 11:26:41,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +40: [2023-04-29 11:26:41,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +40: [2023-04-29 11:26:41,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +25: [2023-04-29 11:26:41,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +27: [2023-04-29 11:26:41,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +27: [2023-04-29 11:26:41,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +36: [2023-04-29 11:26:41,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +16: [2023-04-29 11:26:41,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +36: [2023-04-29 11:26:41,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +27: [2023-04-29 11:26:41,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +17: [2023-04-29 11:26:41,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +63: [2023-04-29 11:26:41,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +56: [2023-04-29 11:26:41,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +56: [2023-04-29 11:26:41,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +47: [2023-04-29 11:26:41,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +45: [2023-04-29 11:26:41,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +50: [2023-04-29 11:26:41,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +50: [2023-04-29 11:26:41,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +44: [2023-04-29 11:26:41,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +16: [2023-04-29 11:26:41,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +50: [2023-04-29 11:26:41,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +16: [2023-04-29 11:26:41,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +16: [2023-04-29 11:26:41,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +25: [2023-04-29 11:26:41,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +44: [2023-04-29 11:26:41,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +44: [2023-04-29 11:26:41,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +63: [2023-04-29 11:26:41,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +63: [2023-04-29 11:26:41,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +45: [2023-04-29 11:26:41,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +40: [2023-04-29 11:26:41,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +56: [2023-04-29 11:26:41,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +56: [2023-04-29 11:26:41,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +35: [2023-04-29 11:26:41,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +44: [2023-04-29 11:26:41,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +30: [2023-04-29 11:26:41,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 7: [2023-04-29 11:26:41,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +16: [2023-04-29 11:26:41,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +35: [2023-04-29 11:26:41,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +14: [2023-04-29 11:26:41,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +14: [2023-04-29 11:26:41,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +17: [2023-04-29 11:26:41,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +56: [2023-04-29 11:26:41,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +56: [2023-04-29 11:26:41,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +14: [2023-04-29 11:26:41,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +14: [2023-04-29 11:26:41,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +14: [2023-04-29 11:26:41,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +44: [2023-04-29 11:26:41,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +16: [2023-04-29 11:26:41,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +45: [2023-04-29 11:26:41,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +44: [2023-04-29 11:26:41,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +44: [2023-04-29 11:26:41,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +47: [2023-04-29 11:26:41,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 5: [2023-04-29 11:26:41,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +36: [2023-04-29 11:26:41,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +36: [2023-04-29 11:26:41,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +45: [2023-04-29 11:26:41,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +45: [2023-04-29 11:26:41,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +14: [2023-04-29 11:26:41,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +14: [2023-04-29 11:26:41,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +24: [2023-04-29 11:26:41,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +24: [2023-04-29 11:26:41,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +59: [2023-04-29 11:26:41,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +30: [2023-04-29 11:26:41,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +14: [2023-04-29 11:26:41,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +35: [2023-04-29 11:26:41,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +30: [2023-04-29 11:26:41,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +30: [2023-04-29 11:26:41,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +35: [2023-04-29 11:26:41,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +63: [2023-04-29 11:26:41,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +63: [2023-04-29 11:26:41,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +45: [2023-04-29 11:26:41,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +52: [2023-04-29 11:26:41,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +52: [2023-04-29 11:26:41,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +40: [2023-04-29 11:26:41,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +35: [2023-04-29 11:26:41,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +35: [2023-04-29 11:26:41,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +36: [2023-04-29 11:26:41,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +36: [2023-04-29 11:26:41,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +14: [2023-04-29 11:26:41,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +14: [2023-04-29 11:26:41,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 5: [2023-04-29 11:26:41,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +20: [2023-04-29 11:26:41,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +59: [2023-04-29 11:26:41,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +25: [2023-04-29 11:26:41,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +36: [2023-04-29 11:26:41,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +59: [2023-04-29 11:26:41,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +14: [2023-04-29 11:26:41,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +52: [2023-04-29 11:26:41,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +43: [2023-04-29 11:26:41,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +43: [2023-04-29 11:26:41,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +45: [2023-04-29 11:26:41,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +14: [2023-04-29 11:26:41,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +14: [2023-04-29 11:26:41,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +52: [2023-04-29 11:26:41,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +14: [2023-04-29 11:26:41,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +14: [2023-04-29 11:26:41,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +40: [2023-04-29 11:26:41,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +45: [2023-04-29 11:26:41,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +20: [2023-04-29 11:26:41,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +63: [2023-04-29 11:26:41,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +45: [2023-04-29 11:26:41,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +63: [2023-04-29 11:26:41,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +63: [2023-04-29 11:26:41,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +24: [2023-04-29 11:26:41,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +24: [2023-04-29 11:26:41,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... + 2: [2023-04-29 11:26:41,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... + 2: [2023-04-29 11:26:41,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... + 2: [2023-04-29 11:26:41,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +49: [2023-04-29 11:26:41,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +49: [2023-04-29 11:26:41,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +43: [2023-04-29 11:26:41,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +43: [2023-04-29 11:26:41,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +36: [2023-04-29 11:26:41,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... + 5: [2023-04-29 11:26:41,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +14: [2023-04-29 11:26:41,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... + 5: [2023-04-29 11:26:41,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +59: [2023-04-29 11:26:41,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +37: [2023-04-29 11:26:41,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +37: [2023-04-29 11:26:41,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +25: [2023-04-29 11:26:41,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +40: [2023-04-29 11:26:41,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +35: [2023-04-29 11:26:41,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +35: [2023-04-29 11:26:41,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +35: [2023-04-29 11:26:41,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +35: [2023-04-29 11:26:41,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +25: [2023-04-29 11:26:41,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +56: [2023-04-29 11:26:41,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +44: [2023-04-29 11:26:41,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +48: [2023-04-29 11:26:41,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +48: [2023-04-29 11:26:41,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +48: [2023-04-29 11:26:41,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +48: [2023-04-29 11:26:41,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +48: [2023-04-29 11:26:41,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +48: [2023-04-29 11:26:41,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +48: [2023-04-29 11:26:41,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +48: [2023-04-29 11:26:41,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +47: [2023-04-29 11:26:41,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +47: [2023-04-29 11:26:41,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +40: [2023-04-29 11:26:41,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +63: [2023-04-29 11:26:41,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +20: [2023-04-29 11:26:41,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +43: [2023-04-29 11:26:41,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +43: [2023-04-29 11:26:41,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +43: [2023-04-29 11:26:41,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +49: [2023-04-29 11:26:41,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +49: [2023-04-29 11:26:41,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +43: [2023-04-29 11:26:41,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +56: [2023-04-29 11:26:41,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +56: [2023-04-29 11:26:41,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +35: [2023-04-29 11:26:41,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +35: [2023-04-29 11:26:41,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +42: [2023-04-29 11:26:41,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +42: [2023-04-29 11:26:41,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +42: [2023-04-29 11:26:41,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +63: [2023-04-29 11:26:41,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +25: [2023-04-29 11:26:41,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +21: [2023-04-29 11:26:41,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +45: [2023-04-29 11:26:41,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +20: [2023-04-29 11:26:41,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... + 5: [2023-04-29 11:26:41,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +57: [2023-04-29 11:26:41,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +57: [2023-04-29 11:26:41,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +45: [2023-04-29 11:26:41,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +35: [2023-04-29 11:26:41,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +49: [2023-04-29 11:26:41,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 11:26:41,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +36: [2023-04-29 11:26:41,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +37: [2023-04-29 11:26:41,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +37: [2023-04-29 11:26:41,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +56: [2023-04-29 11:26:41,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +49: [2023-04-29 11:26:41,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +47: [2023-04-29 11:26:41,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +48: [2023-04-29 11:26:41,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 11:26:41,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +48: [2023-04-29 11:26:41,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +48: [2023-04-29 11:26:41,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +48: [2023-04-29 11:26:41,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +20: [2023-04-29 11:26:41,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +27: [2023-04-29 11:26:41,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +44: [2023-04-29 11:26:41,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +48: [2023-04-29 11:26:41,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +20: [2023-04-29 11:26:41,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +48: [2023-04-29 11:26:41,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +35: [2023-04-29 11:26:41,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +63: [2023-04-29 11:26:41,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +12: [2023-04-29 11:26:41,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +12: [2023-04-29 11:26:41,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +12: [2023-04-29 11:26:41,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +12: [2023-04-29 11:26:41,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +12: [2023-04-29 11:26:41,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +12: [2023-04-29 11:26:41,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +12: [2023-04-29 11:26:41,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +56: [2023-04-29 11:26:41,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +12: [2023-04-29 11:26:41,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +56: [2023-04-29 11:26:41,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +56: [2023-04-29 11:26:41,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +42: [2023-04-29 11:26:41,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +42: [2023-04-29 11:26:41,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +42: [2023-04-29 11:26:41,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +42: [2023-04-29 11:26:41,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +49: [2023-04-29 11:26:41,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +49: [2023-04-29 11:26:41,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 11:26:41,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 11:26:41,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 11:26:41,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +27: [2023-04-29 11:26:41,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 2: [2023-04-29 11:26:41,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +36: [2023-04-29 11:26:41,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +11: [2023-04-29 11:26:41,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 11:26:41,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 11:26:41,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 11:26:41,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 11:26:41,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... + 7: [2023-04-29 11:26:41,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 4: [2023-04-29 11:26:41,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +44: [2023-04-29 11:26:41,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +27: [2023-04-29 11:26:41,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +27: [2023-04-29 11:26:41,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +44: [2023-04-29 11:26:41,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +57: [2023-04-29 11:26:41,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +57: [2023-04-29 11:26:41,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +21: [2023-04-29 11:26:41,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +21: [2023-04-29 11:26:41,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +21: [2023-04-29 11:26:41,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +49: [2023-04-29 11:26:41,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +24: [2023-04-29 11:26:41,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +24: [2023-04-29 11:26:41,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +55: [2023-04-29 11:26:41,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +12: [2023-04-29 11:26:41,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +22: [2023-04-29 11:26:41,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +49: [2023-04-29 11:26:41,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +45: [2023-04-29 11:26:41,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 11:26:41,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +12: [2023-04-29 11:26:41,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +11: [2023-04-29 11:26:41,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... + 4: [2023-04-29 11:26:41,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +12: [2023-04-29 11:26:41,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +58: [2023-04-29 11:26:41,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +12: [2023-04-29 11:26:41,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +12: [2023-04-29 11:26:41,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... + 4: [2023-04-29 11:26:41,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +58: [2023-04-29 11:26:41,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +58: [2023-04-29 11:26:41,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +12: [2023-04-29 11:26:41,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +12: [2023-04-29 11:26:41,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +12: [2023-04-29 11:26:41,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +58: [2023-04-29 11:26:41,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +58: [2023-04-29 11:26:41,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +58: [2023-04-29 11:26:41,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +58: [2023-04-29 11:26:41,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +58: [2023-04-29 11:26:41,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +49: [2023-04-29 11:26:41,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +49: [2023-04-29 11:26:41,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +40: [2023-04-29 11:26:41,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +18: [2023-04-29 11:26:41,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +42: [2023-04-29 11:26:41,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +56: [2023-04-29 11:26:41,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +29: [2023-04-29 11:26:41,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +29: [2023-04-29 11:26:41,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +52: [2023-04-29 11:26:41,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +17: [2023-04-29 11:26:41,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +45: [2023-04-29 11:26:41,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +20: [2023-04-29 11:26:41,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... + 0: [2023-04-29 11:26:41,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 11:26:41,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +29: [2023-04-29 11:26:41,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +29: [2023-04-29 11:26:41,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +29: [2023-04-29 11:26:41,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +29: [2023-04-29 11:26:41,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +29: [2023-04-29 11:26:41,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +52: [2023-04-29 11:26:41,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 11:26:41,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +15: [2023-04-29 11:26:41,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +15: [2023-04-29 11:26:41,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +18: [2023-04-29 11:26:41,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +29: [2023-04-29 11:26:41,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +31: [2023-04-29 11:26:41,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +10: [2023-04-29 11:26:41,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +24: [2023-04-29 11:26:41,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +11: [2023-04-29 11:26:41,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +20: [2023-04-29 11:26:41,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +11: [2023-04-29 11:26:41,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +11: [2023-04-29 11:26:41,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +24: [2023-04-29 11:26:41,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +58: [2023-04-29 11:26:41,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +11: [2023-04-29 11:26:41,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +17: [2023-04-29 11:26:41,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +58: [2023-04-29 11:26:41,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +58: [2023-04-29 11:26:41,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +52: [2023-04-29 11:26:41,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +11: [2023-04-29 11:26:41,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +58: [2023-04-29 11:26:41,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +44: [2023-04-29 11:26:41,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +58: [2023-04-29 11:26:41,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +49: [2023-04-29 11:26:41,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +46: [2023-04-29 11:26:41,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +58: [2023-04-29 11:26:41,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +17: [2023-04-29 11:26:41,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +52: [2023-04-29 11:26:41,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +58: [2023-04-29 11:26:41,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +58: [2023-04-29 11:26:41,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt... +40: [2023-04-29 11:26:41,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +18: [2023-04-29 11:26:41,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +18: [2023-04-29 11:26:41,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +23: [2023-04-29 11:26:41,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +15: [2023-04-29 11:26:41,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +15: [2023-04-29 11:26:41,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +29: [2023-04-29 11:26:41,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +21: [2023-04-29 11:26:41,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +41: [2023-04-29 11:26:41,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +41: [2023-04-29 11:26:41,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +29: [2023-04-29 11:26:41,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +40: [2023-04-29 11:26:41,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +46: [2023-04-29 11:26:41,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +31: [2023-04-29 11:26:41,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +31: [2023-04-29 11:26:41,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +31: [2023-04-29 11:26:41,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +29: [2023-04-29 11:26:41,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +49: [2023-04-29 11:26:41,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +29: [2023-04-29 11:26:41,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +29: [2023-04-29 11:26:41,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +29: [2023-04-29 11:26:41,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +22: [2023-04-29 11:26:41,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +22: [2023-04-29 11:26:41,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 11:26:41,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 11:26:41,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +13: [2023-04-29 11:26:41,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +29: [2023-04-29 11:26:41,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +17: [2023-04-29 11:26:41,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +55: [2023-04-29 11:26:41,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +41: [2023-04-29 11:26:41,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +29: [2023-04-29 11:26:41,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +55: [2023-04-29 11:26:41,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +55: [2023-04-29 11:26:41,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +57: [2023-04-29 11:26:41,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +57: [2023-04-29 11:26:41,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +20: [2023-04-29 11:26:41,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +20: [2023-04-29 11:26:41,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +41: [2023-04-29 11:26:41,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +46: [2023-04-29 11:26:41,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +46: [2023-04-29 11:26:41,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +42: [2023-04-29 11:26:41,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +42: [2023-04-29 11:26:41,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +37: [2023-04-29 11:26:41,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +45: [2023-04-29 11:26:41,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +37: [2023-04-29 11:26:41,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +49: [2023-04-29 11:26:41,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +22: [2023-04-29 11:26:41,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +10: [2023-04-29 11:26:41,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +45: [2023-04-29 11:26:41,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +44: [2023-04-29 11:26:41,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +42: [2023-04-29 11:26:41,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +55: [2023-04-29 11:26:41,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +49: [2023-04-29 11:26:41,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +23: [2023-04-29 11:26:41,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +23: [2023-04-29 11:26:41,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 2: [2023-04-29 11:26:41,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +10: [2023-04-29 11:26:41,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +22: [2023-04-29 11:26:41,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +20: [2023-04-29 11:26:41,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +20: [2023-04-29 11:26:41,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +37: [2023-04-29 11:26:41,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +44: [2023-04-29 11:26:41,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +37: [2023-04-29 11:26:41,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +21: [2023-04-29 11:26:41,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 2: [2023-04-29 11:26:41,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +21: [2023-04-29 11:26:41,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +55: [2023-04-29 11:26:41,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +21: [2023-04-29 11:26:41,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 2: [2023-04-29 11:26:41,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +55: [2023-04-29 11:26:41,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +55: [2023-04-29 11:26:41,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +55: [2023-04-29 11:26:41,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +44: [2023-04-29 11:26:41,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 9: [2023-04-29 11:26:41,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +55: [2023-04-29 11:26:41,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +55: [2023-04-29 11:26:41,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +55: [2023-04-29 11:26:41,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +57: [2023-04-29 11:26:41,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +56: [2023-04-29 11:26:41,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +56: [2023-04-29 11:26:41,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +13: [2023-04-29 11:26:41,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +42: [2023-04-29 11:26:41,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +18: [2023-04-29 11:26:41,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +57: [2023-04-29 11:26:41,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +56: [2023-04-29 11:26:41,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. + 1: [2023-04-29 11:26:41,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 1: [2023-04-29 11:26:41,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 1: [2023-04-29 11:26:41,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 1: [2023-04-29 11:26:41,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 1: [2023-04-29 11:26:41,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 1: [2023-04-29 11:26:41,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 1: [2023-04-29 11:26:41,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +23: [2023-04-29 11:26:41,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 9: [2023-04-29 11:26:41,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 9: [2023-04-29 11:26:41,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +31: [2023-04-29 11:26:41,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +23: [2023-04-29 11:26:41,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +10: [2023-04-29 11:26:41,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +56: [2023-04-29 11:26:41,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +18: [2023-04-29 11:26:41,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +15: [2023-04-29 11:26:41,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +15: [2023-04-29 11:26:41,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +10: [2023-04-29 11:26:41,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +18: [2023-04-29 11:26:41,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +18: [2023-04-29 11:26:41,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +55: [2023-04-29 11:26:41,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... + 9: [2023-04-29 11:26:41,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... + 1: [2023-04-29 11:26:41,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +41: [2023-04-29 11:26:41,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +41: [2023-04-29 11:26:41,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +46: [2023-04-29 11:26:41,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +40: [2023-04-29 11:26:41,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +40: [2023-04-29 11:26:41,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +40: [2023-04-29 11:26:41,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +46: [2023-04-29 11:26:41,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... + 1: [2023-04-29 11:26:41,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +13: [2023-04-29 11:26:41,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +15: [2023-04-29 11:26:41,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +15: [2023-04-29 11:26:41,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +31: [2023-04-29 11:26:41,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +40: [2023-04-29 11:26:41,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +31: [2023-04-29 11:26:41,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +17: [2023-04-29 11:26:41,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +31: [2023-04-29 11:26:41,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +41: [2023-04-29 11:26:41,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +41: [2023-04-29 11:26:41,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +22: [2023-04-29 11:26:41,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +22: [2023-04-29 11:26:41,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +13: [2023-04-29 11:26:41,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +13: [2023-04-29 11:26:41,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +17: [2023-04-29 11:26:41,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +46: [2023-04-29 11:26:41,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +14: [2023-04-29 11:26:41,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +46: [2023-04-29 11:26:41,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +40: [2023-04-29 11:26:41,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +40: [2023-04-29 11:26:41,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +40: [2023-04-29 11:26:41,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +40: [2023-04-29 11:26:41,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt... +17: [2023-04-29 11:26:41,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +42: [2023-04-29 11:26:41,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +42: [2023-04-29 11:26:41,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +42: [2023-04-29 11:26:41,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +20: [2023-04-29 11:26:41,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +23: [2023-04-29 11:26:41,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +22: [2023-04-29 11:26:41,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +23: [2023-04-29 11:26:41,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +14: [2023-04-29 11:26:41,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +14: [2023-04-29 11:26:41,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +14: [2023-04-29 11:26:41,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +20: [2023-04-29 11:26:41,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +56: [2023-04-29 11:26:41,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +56: [2023-04-29 11:26:41,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +56: [2023-04-29 11:26:41,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +17: [2023-04-29 11:26:41,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +48: [2023-04-29 11:26:41,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +48: [2023-04-29 11:26:41,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +49: [2023-04-29 11:26:41,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +42: [2023-04-29 11:26:41,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +11: [2023-04-29 11:26:41,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +10: [2023-04-29 11:26:41,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +12: [2023-04-29 11:26:41,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +12: [2023-04-29 11:26:41,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +56: [2023-04-29 11:26:41,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +55: [2023-04-29 11:26:41,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +23: [2023-04-29 11:26:41,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +55: [2023-04-29 11:26:41,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +49: [2023-04-29 11:26:41,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +49: [2023-04-29 11:26:41,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +20: [2023-04-29 11:26:41,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +48: [2023-04-29 11:26:41,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +48: [2023-04-29 11:26:41,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +10: [2023-04-29 11:26:41,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +12: [2023-04-29 11:26:41,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +12: [2023-04-29 11:26:41,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +20: [2023-04-29 11:26:41,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +58: [2023-04-29 11:26:41,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +58: [2023-04-29 11:26:41,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +55: [2023-04-29 11:26:41,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 4: [2023-04-29 11:26:41,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 4: [2023-04-29 11:26:41,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 4: [2023-04-29 11:26:41,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +11: [2023-04-29 11:26:41,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 11:26:41,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 11:26:41,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +58: [2023-04-29 11:26:41,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +58: [2023-04-29 11:26:41,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +29: [2023-04-29 11:26:41,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +14: [2023-04-29 11:26:41,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +29: [2023-04-29 11:26:41,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +48: [2023-04-29 11:26:41,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +48: [2023-04-29 11:26:41,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +29: [2023-04-29 11:26:41,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +29: [2023-04-29 11:26:41,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 11:26:41,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +10: [2023-04-29 11:26:41,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +14: [2023-04-29 11:26:41,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +12: [2023-04-29 11:26:41,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +12: [2023-04-29 11:26:41,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +14: [2023-04-29 11:26:41,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +49: [2023-04-29 11:26:41,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_00-model_states.pt. +12: [2023-04-29 11:26:41,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +12: [2023-04-29 11:26:41,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +49: [2023-04-29 11:26:41,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +14: [2023-04-29 11:26:41,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +48: [2023-04-29 11:26:41,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 9: [2023-04-29 11:26:41,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +48: [2023-04-29 11:26:41,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +28: [2023-04-29 11:26:41,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +28: [2023-04-29 11:26:41,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +58: [2023-04-29 11:26:41,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +58: [2023-04-29 11:26:41,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +49: [2023-04-29 11:26:41,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +49: [2023-04-29 11:26:41,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +58: [2023-04-29 11:26:41,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +58: [2023-04-29 11:26:41,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +28: [2023-04-29 11:26:41,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +28: [2023-04-29 11:26:41,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +28: [2023-04-29 11:26:41,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +28: [2023-04-29 11:26:41,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +28: [2023-04-29 11:26:41,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +28: [2023-04-29 11:26:41,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +11: [2023-04-29 11:26:41,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +29: [2023-04-29 11:26:41,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +29: [2023-04-29 11:26:41,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 9: [2023-04-29 11:26:41,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 1: [2023-04-29 11:26:41,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 1: [2023-04-29 11:26:41,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. + 1: [2023-04-29 11:26:41,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +28: [2023-04-29 11:26:41,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +28: [2023-04-29 11:26:41,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +11: [2023-04-29 11:26:41,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +28: [2023-04-29 11:26:41,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +28: [2023-04-29 11:26:41,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +11: [2023-04-29 11:26:41,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +28: [2023-04-29 11:26:41,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +28: [2023-04-29 11:26:41,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt... +28: [2023-04-29 11:26:41,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +28: [2023-04-29 11:26:41,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt... +29: [2023-04-29 11:26:41,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +29: [2023-04-29 11:26:41,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +49: [2023-04-29 11:26:41,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 4: [2023-04-29 11:26:41,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 1: [2023-04-29 11:26:41,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +32: [2023-04-29 11:26:41,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +32: [2023-04-29 11:26:41,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +32: [2023-04-29 11:26:41,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +32: [2023-04-29 11:26:41,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +39: [2023-04-29 11:26:41,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +39: [2023-04-29 11:26:41,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +39: [2023-04-29 11:26:41,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +39: [2023-04-29 11:26:41,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +32: [2023-04-29 11:26:41,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +32: [2023-04-29 11:26:41,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +32: [2023-04-29 11:26:41,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 4: [2023-04-29 11:26:41,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +32: [2023-04-29 11:26:41,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +39: [2023-04-29 11:26:41,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +39: [2023-04-29 11:26:41,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +39: [2023-04-29 11:26:41,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +39: [2023-04-29 11:26:41,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 4: [2023-04-29 11:26:41,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 4: [2023-04-29 11:26:41,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +28: [2023-04-29 11:26:41,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +28: [2023-04-29 11:26:41,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +51: [2023-04-29 11:26:41,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +51: [2023-04-29 11:26:41,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +51: [2023-04-29 11:26:41,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. + 4: [2023-04-29 11:26:41,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +51: [2023-04-29 11:26:41,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. + 4: [2023-04-29 11:26:41,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +61: [2023-04-29 11:26:41,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +61: [2023-04-29 11:26:41,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +61: [2023-04-29 11:26:41,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +61: [2023-04-29 11:26:41,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +61: [2023-04-29 11:26:41,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +61: [2023-04-29 11:26:41,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +61: [2023-04-29 11:26:41,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +61: [2023-04-29 11:26:41,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +28: [2023-04-29 11:26:41,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +28: [2023-04-29 11:26:41,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_00-model_states.pt. +28: [2023-04-29 11:26:41,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +61: [2023-04-29 11:26:41,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +61: [2023-04-29 11:26:41,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +61: [2023-04-29 11:26:41,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +61: [2023-04-29 11:26:41,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +51: [2023-04-29 11:26:41,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +51: [2023-04-29 11:26:41,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +51: [2023-04-29 11:26:41,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +51: [2023-04-29 11:26:41,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +28: [2023-04-29 11:26:41,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +51: [2023-04-29 11:26:41,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +51: [2023-04-29 11:26:41,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +51: [2023-04-29 11:26:41,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +51: [2023-04-29 11:26:41,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +51: [2023-04-29 11:26:41,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +51: [2023-04-29 11:26:41,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +51: [2023-04-29 11:26:41,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +51: [2023-04-29 11:26:41,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +28: [2023-04-29 11:26:41,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +32: [2023-04-29 11:26:41,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +32: [2023-04-29 11:26:41,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +32: [2023-04-29 11:26:41,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +32: [2023-04-29 11:26:41,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +28: [2023-04-29 11:26:41,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +39: [2023-04-29 11:26:41,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +39: [2023-04-29 11:26:41,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +61: [2023-04-29 11:26:41,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +61: [2023-04-29 11:26:41,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +16: [2023-04-29 11:26:41,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +16: [2023-04-29 11:26:41,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +16: [2023-04-29 11:26:41,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +16: [2023-04-29 11:26:41,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +61: [2023-04-29 11:26:41,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +61: [2023-04-29 11:26:41,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +39: [2023-04-29 11:26:41,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +39: [2023-04-29 11:26:41,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +16: [2023-04-29 11:26:41,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +16: [2023-04-29 11:26:41,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +16: [2023-04-29 11:26:41,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +16: [2023-04-29 11:26:41,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +39: [2023-04-29 11:26:41,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +39: [2023-04-29 11:26:41,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +32: [2023-04-29 11:26:41,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +32: [2023-04-29 11:26:41,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +32: [2023-04-29 11:26:41,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +32: [2023-04-29 11:26:41,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +19: [2023-04-29 11:26:41,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +19: [2023-04-29 11:26:41,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +61: [2023-04-29 11:26:41,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +61: [2023-04-29 11:26:41,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +39: [2023-04-29 11:26:41,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +19: [2023-04-29 11:26:41,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +19: [2023-04-29 11:26:41,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +19: [2023-04-29 11:26:41,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +19: [2023-04-29 11:26:41,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +39: [2023-04-29 11:26:41,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 11:26:41,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +34: [2023-04-29 11:26:41,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +51: [2023-04-29 11:26:41,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +19: [2023-04-29 11:26:41,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +19: [2023-04-29 11:26:41,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +34: [2023-04-29 11:26:41,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +34: [2023-04-29 11:26:41,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +61: [2023-04-29 11:26:41,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +51: [2023-04-29 11:26:41,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +51: [2023-04-29 11:26:41,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +61: [2023-04-29 11:26:41,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +51: [2023-04-29 11:26:41,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +51: [2023-04-29 11:26:41,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +51: [2023-04-29 11:26:41,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +51: [2023-04-29 11:26:41,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +51: [2023-04-29 11:26:41,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 3: [2023-04-29 11:26:41,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 3: [2023-04-29 11:26:41,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 3: [2023-04-29 11:26:41,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 3: [2023-04-29 11:26:41,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +51: [2023-04-29 11:26:41,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +51: [2023-04-29 11:26:41,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +30: [2023-04-29 11:26:41,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +30: [2023-04-29 11:26:41,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +30: [2023-04-29 11:26:41,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +60: [2023-04-29 11:26:41,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +60: [2023-04-29 11:26:41,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +51: [2023-04-29 11:26:41,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +30: [2023-04-29 11:26:41,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +51: [2023-04-29 11:26:41,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +60: [2023-04-29 11:26:41,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +60: [2023-04-29 11:26:41,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +30: [2023-04-29 11:26:41,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +30: [2023-04-29 11:26:41,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +30: [2023-04-29 11:26:41,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +61: [2023-04-29 11:26:41,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +30: [2023-04-29 11:26:41,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +61: [2023-04-29 11:26:41,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +50: [2023-04-29 11:26:41,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +50: [2023-04-29 11:26:41,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +16: [2023-04-29 11:26:41,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +50: [2023-04-29 11:26:41,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. + 3: [2023-04-29 11:26:41,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +50: [2023-04-29 11:26:41,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. + 5: [2023-04-29 11:26:41,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +61: [2023-04-29 11:26:41,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +53: [2023-04-29 11:26:41,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +53: [2023-04-29 11:26:41,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +34: [2023-04-29 11:26:41,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +34: [2023-04-29 11:26:41,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +53: [2023-04-29 11:26:41,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +53: [2023-04-29 11:26:41,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +16: [2023-04-29 11:26:41,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +61: [2023-04-29 11:26:41,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... + 5: [2023-04-29 11:26:41,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +51: [2023-04-29 11:26:41,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 5: [2023-04-29 11:26:41,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +61: [2023-04-29 11:26:41,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +53: [2023-04-29 11:26:41,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +53: [2023-04-29 11:26:41,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +53: [2023-04-29 11:26:41,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +34: [2023-04-29 11:26:41,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +34: [2023-04-29 11:26:41,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +53: [2023-04-29 11:26:41,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +46: [2023-04-29 11:26:41,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +46: [2023-04-29 11:26:41,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +46: [2023-04-29 11:26:41,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +46: [2023-04-29 11:26:41,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +61: [2023-04-29 11:26:41,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +16: [2023-04-29 11:26:41,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +16: [2023-04-29 11:26:41,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +51: [2023-04-29 11:26:41,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +51: [2023-04-29 11:26:41,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +51: [2023-04-29 11:26:41,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +60: [2023-04-29 11:26:41,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +60: [2023-04-29 11:26:41,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +61: [2023-04-29 11:26:41,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +60: [2023-04-29 11:26:41,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +60: [2023-04-29 11:26:41,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +16: [2023-04-29 11:26:41,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +61: [2023-04-29 11:26:41,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +61: [2023-04-29 11:26:41,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 11:26:41,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +50: [2023-04-29 11:26:41,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +34: [2023-04-29 11:26:41,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +34: [2023-04-29 11:26:41,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +34: [2023-04-29 11:26:41,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +34: [2023-04-29 11:26:41,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +32: [2023-04-29 11:26:41,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +32: [2023-04-29 11:26:41,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. + 8: [2023-04-29 11:26:41,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +61: [2023-04-29 11:26:41,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +32: [2023-04-29 11:26:41,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. + 8: [2023-04-29 11:26:41,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +32: [2023-04-29 11:26:41,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +54: [2023-04-29 11:26:41,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +54: [2023-04-29 11:26:41,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +54: [2023-04-29 11:26:41,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +54: [2023-04-29 11:26:41,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +60: [2023-04-29 11:26:41,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +60: [2023-04-29 11:26:41,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +60: [2023-04-29 11:26:41,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +60: [2023-04-29 11:26:41,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 11:26:41,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +50: [2023-04-29 11:26:41,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +61: [2023-04-29 11:26:41,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +34: [2023-04-29 11:26:41,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +61: [2023-04-29 11:26:41,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +16: [2023-04-29 11:26:41,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +54: [2023-04-29 11:26:41,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +54: [2023-04-29 11:26:41,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +54: [2023-04-29 11:26:41,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +54: [2023-04-29 11:26:41,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +62: [2023-04-29 11:26:41,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +62: [2023-04-29 11:26:41,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +62: [2023-04-29 11:26:41,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +62: [2023-04-29 11:26:41,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +34: [2023-04-29 11:26:41,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 11:26:41,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +38: [2023-04-29 11:26:41,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +38: [2023-04-29 11:26:41,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +60: [2023-04-29 11:26:41,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 11:26:41,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +34: [2023-04-29 11:26:41,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +34: [2023-04-29 11:26:41,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +43: [2023-04-29 11:26:41,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +43: [2023-04-29 11:26:41,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +43: [2023-04-29 11:26:41,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +43: [2023-04-29 11:26:41,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +60: [2023-04-29 11:26:41,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +60: [2023-04-29 11:26:41,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +60: [2023-04-29 11:26:41,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +19: [2023-04-29 11:26:41,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +19: [2023-04-29 11:26:41,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +38: [2023-04-29 11:26:41,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 11:26:41,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +62: [2023-04-29 11:26:41,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 11:26:41,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +62: [2023-04-29 11:26:41,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +62: [2023-04-29 11:26:41,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 11:26:41,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +62: [2023-04-29 11:26:41,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +16: [2023-04-29 11:26:41,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 11:26:41,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +46: [2023-04-29 11:26:41,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +46: [2023-04-29 11:26:41,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +46: [2023-04-29 11:26:41,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +43: [2023-04-29 11:26:41,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +43: [2023-04-29 11:26:41,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +43: [2023-04-29 11:26:41,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +43: [2023-04-29 11:26:41,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +46: [2023-04-29 11:26:41,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +19: [2023-04-29 11:26:41,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +52: [2023-04-29 11:26:41,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +52: [2023-04-29 11:26:41,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +52: [2023-04-29 11:26:41,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +16: [2023-04-29 11:26:41,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +52: [2023-04-29 11:26:41,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +32: [2023-04-29 11:26:41,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +32: [2023-04-29 11:26:41,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +32: [2023-04-29 11:26:41,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +32: [2023-04-29 11:26:41,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +30: [2023-04-29 11:26:41,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +30: [2023-04-29 11:26:41,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +30: [2023-04-29 11:26:41,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +19: [2023-04-29 11:26:41,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 11:26:41,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 11:26:41,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +30: [2023-04-29 11:26:41,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +19: [2023-04-29 11:26:41,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +26: [2023-04-29 11:26:41,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +26: [2023-04-29 11:26:41,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +26: [2023-04-29 11:26:41,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +26: [2023-04-29 11:26:41,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +52: [2023-04-29 11:26:41,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +52: [2023-04-29 11:26:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +52: [2023-04-29 11:26:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +52: [2023-04-29 11:26:41,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +26: [2023-04-29 11:26:41,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +26: [2023-04-29 11:26:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +26: [2023-04-29 11:26:41,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +34: [2023-04-29 11:26:41,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +34: [2023-04-29 11:26:41,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +26: [2023-04-29 11:26:41,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +53: [2023-04-29 11:26:41,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +53: [2023-04-29 11:26:41,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 3: [2023-04-29 11:26:41,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +34: [2023-04-29 11:26:41,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +34: [2023-04-29 11:26:41,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... + 3: [2023-04-29 11:26:41,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +53: [2023-04-29 11:26:41,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +19: [2023-04-29 11:26:41,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +19: [2023-04-29 11:26:41,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +19: [2023-04-29 11:26:41,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +19: [2023-04-29 11:26:41,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +53: [2023-04-29 11:26:41,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +60: [2023-04-29 11:26:41,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +60: [2023-04-29 11:26:41,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +60: [2023-04-29 11:26:41,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +60: [2023-04-29 11:26:41,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +60: [2023-04-29 11:26:41,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +53: [2023-04-29 11:26:41,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +53: [2023-04-29 11:26:41,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +53: [2023-04-29 11:26:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +30: [2023-04-29 11:26:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +53: [2023-04-29 11:26:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +59: [2023-04-29 11:26:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +59: [2023-04-29 11:26:41,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +30: [2023-04-29 11:26:41,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +62: [2023-04-29 11:26:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +62: [2023-04-29 11:26:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +62: [2023-04-29 11:26:41,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +62: [2023-04-29 11:26:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +63: [2023-04-29 11:26:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +63: [2023-04-29 11:26:41,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +30: [2023-04-29 11:26:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +60: [2023-04-29 11:26:41,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +30: [2023-04-29 11:26:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +59: [2023-04-29 11:26:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +59: [2023-04-29 11:26:41,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. + 3: [2023-04-29 11:26:41,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +34: [2023-04-29 11:26:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 11:26:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 11:26:41,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 11:26:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +33: [2023-04-29 11:26:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +33: [2023-04-29 11:26:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +63: [2023-04-29 11:26:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +33: [2023-04-29 11:26:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +50: [2023-04-29 11:26:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 11:26:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 11:26:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +63: [2023-04-29 11:26:41,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +33: [2023-04-29 11:26:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +34: [2023-04-29 11:26:41,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +60: [2023-04-29 11:26:41,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +63: [2023-04-29 11:26:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +63: [2023-04-29 11:26:41,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +54: [2023-04-29 11:26:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +34: [2023-04-29 11:26:41,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +63: [2023-04-29 11:26:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +63: [2023-04-29 11:26:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 5: [2023-04-29 11:26:41,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 5: [2023-04-29 11:26:41,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +60: [2023-04-29 11:26:41,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +54: [2023-04-29 11:26:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +54: [2023-04-29 11:26:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 11:26:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +34: [2023-04-29 11:26:41,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +50: [2023-04-29 11:26:41,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +54: [2023-04-29 11:26:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +43: [2023-04-29 11:26:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +43: [2023-04-29 11:26:41,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +43: [2023-04-29 11:26:41,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +43: [2023-04-29 11:26:41,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +43: [2023-04-29 11:26:41,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +60: [2023-04-29 11:26:41,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +53: [2023-04-29 11:26:41,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +53: [2023-04-29 11:26:41,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 11:26:41,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +38: [2023-04-29 11:26:41,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +19: [2023-04-29 11:26:41,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +50: [2023-04-29 11:26:41,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +50: [2023-04-29 11:26:41,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +43: [2023-04-29 11:26:41,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 3: [2023-04-29 11:26:41,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 11:26:41,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +19: [2023-04-29 11:26:41,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +36: [2023-04-29 11:26:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +36: [2023-04-29 11:26:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +36: [2023-04-29 11:26:41,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 11:26:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +36: [2023-04-29 11:26:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +59: [2023-04-29 11:26:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +59: [2023-04-29 11:26:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +59: [2023-04-29 11:26:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +43: [2023-04-29 11:26:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +43: [2023-04-29 11:26:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +54: [2023-04-29 11:26:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +54: [2023-04-29 11:26:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +38: [2023-04-29 11:26:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +60: [2023-04-29 11:26:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +59: [2023-04-29 11:26:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +60: [2023-04-29 11:26:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 11:26:41,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 11:26:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +38: [2023-04-29 11:26:41,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 11:26:41,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +50: [2023-04-29 11:26:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +50: [2023-04-29 11:26:41,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +26: [2023-04-29 11:26:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +26: [2023-04-29 11:26:41,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 5: [2023-04-29 11:26:41,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +26: [2023-04-29 11:26:41,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +26: [2023-04-29 11:26:41,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +54: [2023-04-29 11:26:41,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +62: [2023-04-29 11:26:41,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +36: [2023-04-29 11:26:41,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +53: [2023-04-29 11:26:41,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +54: [2023-04-29 11:26:41,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +50: [2023-04-29 11:26:41,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +50: [2023-04-29 11:26:41,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +36: [2023-04-29 11:26:41,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +36: [2023-04-29 11:26:41,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +53: [2023-04-29 11:26:41,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +36: [2023-04-29 11:26:41,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +34: [2023-04-29 11:26:41,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +60: [2023-04-29 11:26:41,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +59: [2023-04-29 11:26:41,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +62: [2023-04-29 11:26:41,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +53: [2023-04-29 11:26:41,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +59: [2023-04-29 11:26:41,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +34: [2023-04-29 11:26:41,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 3: [2023-04-29 11:26:41,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +53: [2023-04-29 11:26:41,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +53: [2023-04-29 11:26:41,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +62: [2023-04-29 11:26:41,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +62: [2023-04-29 11:26:41,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +30: [2023-04-29 11:26:41,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +30: [2023-04-29 11:26:41,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +62: [2023-04-29 11:26:41,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +30: [2023-04-29 11:26:41,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +53: [2023-04-29 11:26:41,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +34: [2023-04-29 11:26:41,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +30: [2023-04-29 11:26:41,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +59: [2023-04-29 11:26:41,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +59: [2023-04-29 11:26:41,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +59: [2023-04-29 11:26:41,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +59: [2023-04-29 11:26:41,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +33: [2023-04-29 11:26:41,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +34: [2023-04-29 11:26:41,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +33: [2023-04-29 11:26:41,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +32: [2023-04-29 11:26:41,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +59: [2023-04-29 11:26:41,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 7: [2023-04-29 11:26:41,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +60: [2023-04-29 11:26:41,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +62: [2023-04-29 11:26:41,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +33: [2023-04-29 11:26:41,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +54: [2023-04-29 11:26:41,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 11:26:41,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +59: [2023-04-29 11:26:41,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +27: [2023-04-29 11:26:41,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +27: [2023-04-29 11:26:41,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +27: [2023-04-29 11:26:41,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +62: [2023-04-29 11:26:41,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +27: [2023-04-29 11:26:41,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +32: [2023-04-29 11:26:41,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... + 7: [2023-04-29 11:26:41,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 7: [2023-04-29 11:26:41,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +38: [2023-04-29 11:26:41,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 7: [2023-04-29 11:26:41,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +27: [2023-04-29 11:26:41,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +54: [2023-04-29 11:26:41,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +32: [2023-04-29 11:26:41,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +32: [2023-04-29 11:26:41,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +38: [2023-04-29 11:26:41,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +38: [2023-04-29 11:26:41,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +43: [2023-04-29 11:26:41,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +54: [2023-04-29 11:26:41,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +54: [2023-04-29 11:26:41,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +43: [2023-04-29 11:26:41,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +43: [2023-04-29 11:26:41,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +27: [2023-04-29 11:26:41,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +27: [2023-04-29 11:26:41,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +43: [2023-04-29 11:26:41,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +62: [2023-04-29 11:26:41,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +27: [2023-04-29 11:26:41,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +38: [2023-04-29 11:26:41,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +60: [2023-04-29 11:26:41,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +43: [2023-04-29 11:26:41,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +60: [2023-04-29 11:26:41,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +43: [2023-04-29 11:26:41,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +43: [2023-04-29 11:26:41,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +32: [2023-04-29 11:26:41,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +62: [2023-04-29 11:26:41,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +54: [2023-04-29 11:26:41,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +32: [2023-04-29 11:26:41,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +32: [2023-04-29 11:26:41,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +43: [2023-04-29 11:26:41,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +26: [2023-04-29 11:26:41,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +54: [2023-04-29 11:26:41,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +26: [2023-04-29 11:26:41,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +54: [2023-04-29 11:26:41,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +54: [2023-04-29 11:26:41,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +26: [2023-04-29 11:26:41,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +26: [2023-04-29 11:26:41,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +34: [2023-04-29 11:26:41,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +26: [2023-04-29 11:26:41,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +26: [2023-04-29 11:26:41,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +60: [2023-04-29 11:26:41,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 11:26:41,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +30: [2023-04-29 11:26:41,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +32: [2023-04-29 11:26:41,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +30: [2023-04-29 11:26:41,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +30: [2023-04-29 11:26:41,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +39: [2023-04-29 11:26:41,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +39: [2023-04-29 11:26:41,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +39: [2023-04-29 11:26:41,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +39: [2023-04-29 11:26:41,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +30: [2023-04-29 11:26:41,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +26: [2023-04-29 11:26:41,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +26: [2023-04-29 11:26:41,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +62: [2023-04-29 11:26:41,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 11:26:41,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 11:26:41,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +33: [2023-04-29 11:26:41,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +33: [2023-04-29 11:26:41,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +33: [2023-04-29 11:26:41,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +62: [2023-04-29 11:26:41,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 11:26:41,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +33: [2023-04-29 11:26:41,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +33: [2023-04-29 11:26:41,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +33: [2023-04-29 11:26:41,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 0: [2023-04-29 11:26:41,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +63: [2023-04-29 11:26:41,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 0: [2023-04-29 11:26:41,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +63: [2023-04-29 11:26:41,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +62: [2023-04-29 11:26:41,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +57: [2023-04-29 11:26:41,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +57: [2023-04-29 11:26:41,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +24: [2023-04-29 11:26:41,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +24: [2023-04-29 11:26:41,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +24: [2023-04-29 11:26:41,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +24: [2023-04-29 11:26:41,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +19: [2023-04-29 11:26:41,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +37: [2023-04-29 11:26:41,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +37: [2023-04-29 11:26:41,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +37: [2023-04-29 11:26:41,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +37: [2023-04-29 11:26:41,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +57: [2023-04-29 11:26:41,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +63: [2023-04-29 11:26:41,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +63: [2023-04-29 11:26:41,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +57: [2023-04-29 11:26:41,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +57: [2023-04-29 11:26:41,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +57: [2023-04-29 11:26:41,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +36: [2023-04-29 11:26:41,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +19: [2023-04-29 11:26:41,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 7: [2023-04-29 11:26:41,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 7: [2023-04-29 11:26:41,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 7: [2023-04-29 11:26:41,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 7: [2023-04-29 11:26:41,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +47: [2023-04-29 11:26:41,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +47: [2023-04-29 11:26:41,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +57: [2023-04-29 11:26:41,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +26: [2023-04-29 11:26:41,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +57: [2023-04-29 11:26:41,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +26: [2023-04-29 11:26:41,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 11:26:41,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +26: [2023-04-29 11:26:41,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 11:26:41,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 9: [2023-04-29 11:26:41,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 9: [2023-04-29 11:26:41,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 9: [2023-04-29 11:26:41,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 9: [2023-04-29 11:26:41,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +19: [2023-04-29 11:26:41,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +47: [2023-04-29 11:26:41,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +47: [2023-04-29 11:26:41,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +19: [2023-04-29 11:26:41,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +19: [2023-04-29 11:26:41,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +47: [2023-04-29 11:26:41,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +47: [2023-04-29 11:26:41,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +50: [2023-04-29 11:26:41,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 9: [2023-04-29 11:26:41,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 9: [2023-04-29 11:26:41,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 8: [2023-04-29 11:26:41,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 8: [2023-04-29 11:26:41,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +26: [2023-04-29 11:26:41,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 11:26:41,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +39: [2023-04-29 11:26:41,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +39: [2023-04-29 11:26:41,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 5: [2023-04-29 11:26:41,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 5: [2023-04-29 11:26:41,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 5: [2023-04-29 11:26:41,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +39: [2023-04-29 11:26:41,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 5: [2023-04-29 11:26:41,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +47: [2023-04-29 11:26:41,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +59: [2023-04-29 11:26:41,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +59: [2023-04-29 11:26:41,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +39: [2023-04-29 11:26:41,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +50: [2023-04-29 11:26:41,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 11:26:41,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 11:26:41,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +36: [2023-04-29 11:26:41,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +36: [2023-04-29 11:26:41,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +36: [2023-04-29 11:26:41,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +47: [2023-04-29 11:26:41,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +53: [2023-04-29 11:26:41,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +63: [2023-04-29 11:26:41,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +53: [2023-04-29 11:26:41,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +53: [2023-04-29 11:26:41,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 9: [2023-04-29 11:26:41,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 0: [2023-04-29 11:26:41,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +59: [2023-04-29 11:26:41,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +27: [2023-04-29 11:26:41,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 9: [2023-04-29 11:26:41,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +63: [2023-04-29 11:26:41,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +24: [2023-04-29 11:26:41,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 9: [2023-04-29 11:26:41,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +62: [2023-04-29 11:26:41,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +59: [2023-04-29 11:26:41,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +59: [2023-04-29 11:26:41,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +53: [2023-04-29 11:26:41,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 11:26:41,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +24: [2023-04-29 11:26:41,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +53: [2023-04-29 11:26:41,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +53: [2023-04-29 11:26:41,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +53: [2023-04-29 11:26:41,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +24: [2023-04-29 11:26:41,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +24: [2023-04-29 11:26:41,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +59: [2023-04-29 11:26:41,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +37: [2023-04-29 11:26:41,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +36: [2023-04-29 11:26:41,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 7: [2023-04-29 11:26:41,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +37: [2023-04-29 11:26:41,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 6: [2023-04-29 11:26:41,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 6: [2023-04-29 11:26:41,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 6: [2023-04-29 11:26:41,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +33: [2023-04-29 11:26:41,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +33: [2023-04-29 11:26:41,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +63: [2023-04-29 11:26:41,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 11:26:41,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +53: [2023-04-29 11:26:41,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +62: [2023-04-29 11:26:41,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +23: [2023-04-29 11:26:41,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +23: [2023-04-29 11:26:41,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +23: [2023-04-29 11:26:41,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +23: [2023-04-29 11:26:41,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +62: [2023-04-29 11:26:41,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +62: [2023-04-29 11:26:41,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 11:26:41,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +27: [2023-04-29 11:26:41,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +27: [2023-04-29 11:26:41,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +27: [2023-04-29 11:26:41,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +43: [2023-04-29 11:26:41,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +43: [2023-04-29 11:26:41,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 11:26:41,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +37: [2023-04-29 11:26:41,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 11:26:41,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +37: [2023-04-29 11:26:41,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +33: [2023-04-29 11:26:41,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 11:26:41,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +62: [2023-04-29 11:26:41,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +59: [2023-04-29 11:26:41,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +59: [2023-04-29 11:26:41,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +59: [2023-04-29 11:26:41,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +59: [2023-04-29 11:26:41,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +33: [2023-04-29 11:26:41,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +33: [2023-04-29 11:26:41,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +37: [2023-04-29 11:26:41,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +33: [2023-04-29 11:26:41,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +62: [2023-04-29 11:26:41,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +62: [2023-04-29 11:26:41,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +48: [2023-04-29 11:26:41,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +48: [2023-04-29 11:26:41,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +48: [2023-04-29 11:26:41,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +43: [2023-04-29 11:26:41,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +43: [2023-04-29 11:26:41,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +59: [2023-04-29 11:26:41,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +48: [2023-04-29 11:26:41,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +43: [2023-04-29 11:26:41,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +43: [2023-04-29 11:26:41,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +22: [2023-04-29 11:26:41,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 11:26:41,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +62: [2023-04-29 11:26:41,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +54: [2023-04-29 11:26:41,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +33: [2023-04-29 11:26:41,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... + 2: [2023-04-29 11:26:41,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +37: [2023-04-29 11:26:41,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +37: [2023-04-29 11:26:41,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 5: [2023-04-29 11:26:41,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +43: [2023-04-29 11:26:41,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +43: [2023-04-29 11:26:41,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +41: [2023-04-29 11:26:41,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +41: [2023-04-29 11:26:41,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +41: [2023-04-29 11:26:41,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +22: [2023-04-29 11:26:41,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 11:26:41,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +54: [2023-04-29 11:26:41,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +41: [2023-04-29 11:26:41,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +33: [2023-04-29 11:26:41,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... + 2: [2023-04-29 11:26:41,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +26: [2023-04-29 11:26:41,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +54: [2023-04-29 11:26:41,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +54: [2023-04-29 11:26:41,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... + 5: [2023-04-29 11:26:41,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +22: [2023-04-29 11:26:41,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 2: [2023-04-29 11:26:41,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +22: [2023-04-29 11:26:41,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +54: [2023-04-29 11:26:41,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +30: [2023-04-29 11:26:41,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +36: [2023-04-29 11:26:41,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +31: [2023-04-29 11:26:41,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +31: [2023-04-29 11:26:41,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +59: [2023-04-29 11:26:41,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... + 8: [2023-04-29 11:26:41,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +22: [2023-04-29 11:26:41,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +44: [2023-04-29 11:26:41,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +44: [2023-04-29 11:26:41,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +44: [2023-04-29 11:26:41,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +44: [2023-04-29 11:26:41,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +54: [2023-04-29 11:26:41,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... + 5: [2023-04-29 11:26:41,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 2: [2023-04-29 11:26:41,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 5: [2023-04-29 11:26:41,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +30: [2023-04-29 11:26:41,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +30: [2023-04-29 11:26:41,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +54: [2023-04-29 11:26:41,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... + 9: [2023-04-29 11:26:41,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +27: [2023-04-29 11:26:41,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +36: [2023-04-29 11:26:41,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +36: [2023-04-29 11:26:41,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +22: [2023-04-29 11:26:41,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +31: [2023-04-29 11:26:41,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +31: [2023-04-29 11:26:41,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +54: [2023-04-29 11:26:41,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... + 7: [2023-04-29 11:26:41,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +44: [2023-04-29 11:26:41,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +44: [2023-04-29 11:26:41,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +30: [2023-04-29 11:26:41,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +38: [2023-04-29 11:26:41,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +38: [2023-04-29 11:26:41,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +30: [2023-04-29 11:26:41,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +38: [2023-04-29 11:26:41,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +50: [2023-04-29 11:26:41,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +31: [2023-04-29 11:26:41,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +38: [2023-04-29 11:26:41,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +31: [2023-04-29 11:26:41,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +30: [2023-04-29 11:26:41,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 0: [2023-04-29 11:26:41,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +44: [2023-04-29 11:26:41,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +44: [2023-04-29 11:26:41,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +26: [2023-04-29 11:26:41,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +30: [2023-04-29 11:26:41,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +33: [2023-04-29 11:26:41,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +23: [2023-04-29 11:26:41,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +30: [2023-04-29 11:26:41,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +26: [2023-04-29 11:26:41,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +31: [2023-04-29 11:26:41,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +31: [2023-04-29 11:26:41,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +26: [2023-04-29 11:26:41,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +23: [2023-04-29 11:26:41,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +23: [2023-04-29 11:26:41,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +23: [2023-04-29 11:26:41,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +52: [2023-04-29 11:26:41,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +52: [2023-04-29 11:26:41,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +52: [2023-04-29 11:26:41,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +52: [2023-04-29 11:26:41,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +52: [2023-04-29 11:26:41,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +52: [2023-04-29 11:26:41,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +52: [2023-04-29 11:26:41,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +52: [2023-04-29 11:26:41,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +48: [2023-04-29 11:26:41,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +27: [2023-04-29 11:26:41,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +33: [2023-04-29 11:26:41,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +50: [2023-04-29 11:26:41,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +48: [2023-04-29 11:26:41,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +48: [2023-04-29 11:26:41,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +10: [2023-04-29 11:26:41,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +10: [2023-04-29 11:26:41,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +10: [2023-04-29 11:26:41,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +18: [2023-04-29 11:26:41,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +18: [2023-04-29 11:26:41,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +15: [2023-04-29 11:26:41,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +15: [2023-04-29 11:26:41,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +15: [2023-04-29 11:26:41,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +10: [2023-04-29 11:26:41,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +48: [2023-04-29 11:26:41,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +18: [2023-04-29 11:26:41,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +15: [2023-04-29 11:26:41,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +18: [2023-04-29 11:26:41,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +27: [2023-04-29 11:26:41,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +27: [2023-04-29 11:26:41,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +50: [2023-04-29 11:26:41,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +26: [2023-04-29 11:26:41,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 4: [2023-04-29 11:26:41,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +50: [2023-04-29 11:26:41,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 4: [2023-04-29 11:26:41,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +52: [2023-04-29 11:26:41,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +52: [2023-04-29 11:26:41,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +52: [2023-04-29 11:26:41,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +52: [2023-04-29 11:26:41,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +52: [2023-04-29 11:26:41,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +52: [2023-04-29 11:26:41,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +52: [2023-04-29 11:26:41,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +26: [2023-04-29 11:26:41,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +57: [2023-04-29 11:26:41,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +57: [2023-04-29 11:26:41,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +59: [2023-04-29 11:26:41,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +52: [2023-04-29 11:26:41,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +26: [2023-04-29 11:26:41,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +59: [2023-04-29 11:26:41,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +10: [2023-04-29 11:26:41,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +10: [2023-04-29 11:26:41,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 4: [2023-04-29 11:26:41,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 4: [2023-04-29 11:26:41,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +59: [2023-04-29 11:26:41,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +11: [2023-04-29 11:26:41,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +11: [2023-04-29 11:26:41,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +11: [2023-04-29 11:26:41,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +10: [2023-04-29 11:26:41,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +11: [2023-04-29 11:26:41,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +33: [2023-04-29 11:26:41,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +41: [2023-04-29 11:26:41,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +33: [2023-04-29 11:26:41,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +41: [2023-04-29 11:26:41,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +41: [2023-04-29 11:26:41,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +59: [2023-04-29 11:26:41,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 4: [2023-04-29 11:26:41,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +10: [2023-04-29 11:26:41,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +57: [2023-04-29 11:26:41,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +26: [2023-04-29 11:26:41,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +41: [2023-04-29 11:26:41,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +33: [2023-04-29 11:26:41,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +57: [2023-04-29 11:26:41,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +12: [2023-04-29 11:26:41,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +12: [2023-04-29 11:26:41,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +12: [2023-04-29 11:26:41,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +12: [2023-04-29 11:26:41,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +38: [2023-04-29 11:26:41,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 11:26:41,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +47: [2023-04-29 11:26:41,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +38: [2023-04-29 11:26:41,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 11:26:41,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +47: [2023-04-29 11:26:41,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 2: [2023-04-29 11:26:41,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 2: [2023-04-29 11:26:41,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 2: [2023-04-29 11:26:41,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 7: [2023-04-29 11:26:41,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 7: [2023-04-29 11:26:41,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +39: [2023-04-29 11:26:41,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +39: [2023-04-29 11:26:41,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 9: [2023-04-29 11:26:41,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +47: [2023-04-29 11:26:41,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +47: [2023-04-29 11:26:41,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +13: [2023-04-29 11:26:41,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +13: [2023-04-29 11:26:41,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +13: [2023-04-29 11:26:41,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 9: [2023-04-29 11:26:41,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +13: [2023-04-29 11:26:41,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +25: [2023-04-29 11:26:41,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +25: [2023-04-29 11:26:41,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +33: [2023-04-29 11:26:41,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +25: [2023-04-29 11:26:41,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +18: [2023-04-29 11:26:41,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +18: [2023-04-29 11:26:41,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +25: [2023-04-29 11:26:41,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +15: [2023-04-29 11:26:41,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +39: [2023-04-29 11:26:41,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +39: [2023-04-29 11:26:41,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +18: [2023-04-29 11:26:41,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +18: [2023-04-29 11:26:41,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +39: [2023-04-29 11:26:41,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +39: [2023-04-29 11:26:41,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +57: [2023-04-29 11:26:41,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +57: [2023-04-29 11:26:41,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +13: [2023-04-29 11:26:41,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +15: [2023-04-29 11:26:41,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +13: [2023-04-29 11:26:41,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +15: [2023-04-29 11:26:41,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +13: [2023-04-29 11:26:41,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +13: [2023-04-29 11:26:41,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +15: [2023-04-29 11:26:41,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +25: [2023-04-29 11:26:41,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +25: [2023-04-29 11:26:41,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +55: [2023-04-29 11:26:41,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +55: [2023-04-29 11:26:41,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 11:26:41,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +55: [2023-04-29 11:26:41,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +11: [2023-04-29 11:26:41,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +55: [2023-04-29 11:26:41,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +25: [2023-04-29 11:26:41,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +25: [2023-04-29 11:26:41,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +25: [2023-04-29 11:26:41,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +25: [2023-04-29 11:26:41,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +22: [2023-04-29 11:26:41,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +22: [2023-04-29 11:26:41,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +37: [2023-04-29 11:26:41,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 11:26:41,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +39: [2023-04-29 11:26:41,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +33: [2023-04-29 11:26:41,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +39: [2023-04-29 11:26:41,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +33: [2023-04-29 11:26:41,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +11: [2023-04-29 11:26:41,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +11: [2023-04-29 11:26:41,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +22: [2023-04-29 11:26:41,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +12: [2023-04-29 11:26:41,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +42: [2023-04-29 11:26:41,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +42: [2023-04-29 11:26:41,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +25: [2023-04-29 11:26:41,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +22: [2023-04-29 11:26:41,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +25: [2023-04-29 11:26:41,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +55: [2023-04-29 11:26:41,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +11: [2023-04-29 11:26:41,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +37: [2023-04-29 11:26:41,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +57: [2023-04-29 11:26:41,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +55: [2023-04-29 11:26:41,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +42: [2023-04-29 11:26:41,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +28: [2023-04-29 11:26:41,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +28: [2023-04-29 11:26:41,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +12: [2023-04-29 11:26:41,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +42: [2023-04-29 11:26:41,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +12: [2023-04-29 11:26:41,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +12: [2023-04-29 11:26:41,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 9: [2023-04-29 11:26:41,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +55: [2023-04-29 11:26:41,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +55: [2023-04-29 11:26:41,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +28: [2023-04-29 11:26:41,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +28: [2023-04-29 11:26:41,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 7: [2023-04-29 11:26:41,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +57: [2023-04-29 11:26:41,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +47: [2023-04-29 11:26:41,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +42: [2023-04-29 11:26:41,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +42: [2023-04-29 11:26:41,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +42: [2023-04-29 11:26:41,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 5: [2023-04-29 11:26:41,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +39: [2023-04-29 11:26:41,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +39: [2023-04-29 11:26:41,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +58: [2023-04-29 11:26:41,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +58: [2023-04-29 11:26:41,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +39: [2023-04-29 11:26:41,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +39: [2023-04-29 11:26:41,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 9: [2023-04-29 11:26:41,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +47: [2023-04-29 11:26:41,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +42: [2023-04-29 11:26:41,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +44: [2023-04-29 11:26:41,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +58: [2023-04-29 11:26:41,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +58: [2023-04-29 11:26:41,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. + 7: [2023-04-29 11:26:41,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +58: [2023-04-29 11:26:41,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +58: [2023-04-29 11:26:41,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +57: [2023-04-29 11:26:41,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. + 5: [2023-04-29 11:26:41,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +57: [2023-04-29 11:26:41,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +57: [2023-04-29 11:26:41,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. + 5: [2023-04-29 11:26:41,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +20: [2023-04-29 11:26:41,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +57: [2023-04-29 11:26:41,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. + 0: [2023-04-29 11:26:41,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +20: [2023-04-29 11:26:41,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +20: [2023-04-29 11:26:41,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +15: [2023-04-29 11:26:41,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +15: [2023-04-29 11:26:41,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +20: [2023-04-29 11:26:41,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +15: [2023-04-29 11:26:41,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +15: [2023-04-29 11:26:41,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +39: [2023-04-29 11:26:41,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +39: [2023-04-29 11:26:41,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 7: [2023-04-29 11:26:41,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 8: [2023-04-29 11:26:41,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +37: [2023-04-29 11:26:41,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +39: [2023-04-29 11:26:41,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +44: [2023-04-29 11:26:41,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +35: [2023-04-29 11:26:41,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +35: [2023-04-29 11:26:41,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +39: [2023-04-29 11:26:41,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +35: [2023-04-29 11:26:41,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +35: [2023-04-29 11:26:41,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. + 2: [2023-04-29 11:26:41,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 5: [2023-04-29 11:26:41,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +58: [2023-04-29 11:26:41,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 2: [2023-04-29 11:26:41,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 2: [2023-04-29 11:26:41,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +37: [2023-04-29 11:26:41,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 11:26:41,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 11:26:41,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +58: [2023-04-29 11:26:41,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 11:26:41,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +63: [2023-04-29 11:26:41,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +63: [2023-04-29 11:26:41,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +63: [2023-04-29 11:26:41,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +63: [2023-04-29 11:26:41,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. + 2: [2023-04-29 11:26:41,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +15: [2023-04-29 11:26:41,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +15: [2023-04-29 11:26:41,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +47: [2023-04-29 11:26:41,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +15: [2023-04-29 11:26:41,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +15: [2023-04-29 11:26:41,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +58: [2023-04-29 11:26:41,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +47: [2023-04-29 11:26:41,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +58: [2023-04-29 11:26:41,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 11:26:41,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 2: [2023-04-29 11:26:41,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +31: [2023-04-29 11:26:41,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +31: [2023-04-29 11:26:41,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +31: [2023-04-29 11:26:41,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +37: [2023-04-29 11:26:41,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +37: [2023-04-29 11:26:41,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +44: [2023-04-29 11:26:41,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +37: [2023-04-29 11:26:41,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +44: [2023-04-29 11:26:41,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +58: [2023-04-29 11:26:41,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +12: [2023-04-29 11:26:41,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +12: [2023-04-29 11:26:41,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 9: [2023-04-29 11:26:41,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +12: [2023-04-29 11:26:41,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +12: [2023-04-29 11:26:41,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 11:26:41,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +25: [2023-04-29 11:26:41,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 5: [2023-04-29 11:26:41,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +58: [2023-04-29 11:26:41,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +22: [2023-04-29 11:26:41,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 11:26:41,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +25: [2023-04-29 11:26:41,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +25: [2023-04-29 11:26:41,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +52: [2023-04-29 11:26:41,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +18: [2023-04-29 11:26:41,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +18: [2023-04-29 11:26:41,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +31: [2023-04-29 11:26:41,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +31: [2023-04-29 11:26:41,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +31: [2023-04-29 11:26:41,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +37: [2023-04-29 11:26:41,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +37: [2023-04-29 11:26:41,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +25: [2023-04-29 11:26:41,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +18: [2023-04-29 11:26:41,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +18: [2023-04-29 11:26:41,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +31: [2023-04-29 11:26:41,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 4: [2023-04-29 11:26:41,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +21: [2023-04-29 11:26:41,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +21: [2023-04-29 11:26:41,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +31: [2023-04-29 11:26:41,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 9: [2023-04-29 11:26:41,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +12: [2023-04-29 11:26:41,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +12: [2023-04-29 11:26:41,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +28: [2023-04-29 11:26:41,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +28: [2023-04-29 11:26:41,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +12: [2023-04-29 11:26:41,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +21: [2023-04-29 11:26:41,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +12: [2023-04-29 11:26:41,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +21: [2023-04-29 11:26:41,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +21: [2023-04-29 11:26:41,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +21: [2023-04-29 11:26:41,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +10: [2023-04-29 11:26:41,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +10: [2023-04-29 11:26:41,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 6: [2023-04-29 11:26:41,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +10: [2023-04-29 11:26:41,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +10: [2023-04-29 11:26:41,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +28: [2023-04-29 11:26:41,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +10: [2023-04-29 11:26:41,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 8: [2023-04-29 11:26:41,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +28: [2023-04-29 11:26:41,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +24: [2023-04-29 11:26:41,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +52: [2023-04-29 11:26:41,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +24: [2023-04-29 11:26:41,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +24: [2023-04-29 11:26:41,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 11:26:41,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +24: [2023-04-29 11:26:41,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +24: [2023-04-29 11:26:41,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 11:26:41,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +24: [2023-04-29 11:26:41,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +24: [2023-04-29 11:26:41,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +18: [2023-04-29 11:26:41,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +18: [2023-04-29 11:26:41,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +24: [2023-04-29 11:26:41,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 9: [2023-04-29 11:26:41,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +18: [2023-04-29 11:26:41,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +52: [2023-04-29 11:26:41,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +22: [2023-04-29 11:26:41,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +52: [2023-04-29 11:26:41,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 9: [2023-04-29 11:26:41,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +18: [2023-04-29 11:26:41,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +10: [2023-04-29 11:26:41,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 8: [2023-04-29 11:26:41,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 4: [2023-04-29 11:26:41,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +21: [2023-04-29 11:26:41,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +21: [2023-04-29 11:26:41,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 11:26:41,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +16: [2023-04-29 11:26:41,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +16: [2023-04-29 11:26:41,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +16: [2023-04-29 11:26:41,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 7: [2023-04-29 11:26:41,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +16: [2023-04-29 11:26:41,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +21: [2023-04-29 11:26:41,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +49: [2023-04-29 11:26:41,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 11:26:41,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +49: [2023-04-29 11:26:41,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +57: [2023-04-29 11:26:41,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +24: [2023-04-29 11:26:41,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +21: [2023-04-29 11:26:41,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +49: [2023-04-29 11:26:41,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +24: [2023-04-29 11:26:41,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +24: [2023-04-29 11:26:41,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +44: [2023-04-29 11:26:41,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 4: [2023-04-29 11:26:41,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 6: [2023-04-29 11:26:41,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 6: [2023-04-29 11:26:41,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 6: [2023-04-29 11:26:41,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +20: [2023-04-29 11:26:41,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +21: [2023-04-29 11:26:41,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +21: [2023-04-29 11:26:41,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +16: [2023-04-29 11:26:41,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +38: [2023-04-29 11:26:41,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +24: [2023-04-29 11:26:41,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +24: [2023-04-29 11:26:41,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +24: [2023-04-29 11:26:41,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +24: [2023-04-29 11:26:41,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 9: [2023-04-29 11:26:41,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +49: [2023-04-29 11:26:41,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +24: [2023-04-29 11:26:41,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +44: [2023-04-29 11:26:41,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +58: [2023-04-29 11:26:41,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +16: [2023-04-29 11:26:41,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +16: [2023-04-29 11:26:41,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +40: [2023-04-29 11:26:41,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +57: [2023-04-29 11:26:41,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 11:26:41,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +40: [2023-04-29 11:26:41,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +40: [2023-04-29 11:26:41,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +16: [2023-04-29 11:26:41,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +40: [2023-04-29 11:26:41,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +49: [2023-04-29 11:26:41,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +57: [2023-04-29 11:26:41,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +49: [2023-04-29 11:26:41,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +57: [2023-04-29 11:26:41,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +58: [2023-04-29 11:26:41,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 0: [2023-04-29 11:26:41,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +49: [2023-04-29 11:26:41,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +38: [2023-04-29 11:26:41,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... + 8: [2023-04-29 11:26:41,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +63: [2023-04-29 11:26:41,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 9: [2023-04-29 11:26:41,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +20: [2023-04-29 11:26:41,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +37: [2023-04-29 11:26:41,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 2: [2023-04-29 11:26:41,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +37: [2023-04-29 11:26:41,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +58: [2023-04-29 11:26:41,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +58: [2023-04-29 11:26:41,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 11:26:41,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +29: [2023-04-29 11:26:41,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +38: [2023-04-29 11:26:41,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +63: [2023-04-29 11:26:41,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +29: [2023-04-29 11:26:41,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +52: [2023-04-29 11:26:41,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +29: [2023-04-29 11:26:41,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +29: [2023-04-29 11:26:41,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 11:26:41,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 9: [2023-04-29 11:26:41,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 0: [2023-04-29 11:26:41,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +46: [2023-04-29 11:26:41,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +46: [2023-04-29 11:26:41,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +44: [2023-04-29 11:26:41,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +38: [2023-04-29 11:26:41,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 2: [2023-04-29 11:26:41,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +10: [2023-04-29 11:26:41,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +20: [2023-04-29 11:26:41,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +16: [2023-04-29 11:26:41,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +16: [2023-04-29 11:26:41,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +63: [2023-04-29 11:26:41,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +63: [2023-04-29 11:26:41,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +56: [2023-04-29 11:26:41,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +56: [2023-04-29 11:26:41,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +56: [2023-04-29 11:26:41,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +46: [2023-04-29 11:26:41,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +46: [2023-04-29 11:26:41,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +46: [2023-04-29 11:26:41,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +46: [2023-04-29 11:26:41,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +46: [2023-04-29 11:26:41,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +56: [2023-04-29 11:26:41,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +44: [2023-04-29 11:26:41,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +31: [2023-04-29 11:26:41,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +46: [2023-04-29 11:26:41,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +31: [2023-04-29 11:26:41,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +31: [2023-04-29 11:26:41,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +29: [2023-04-29 11:26:41,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +29: [2023-04-29 11:26:41,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +10: [2023-04-29 11:26:41,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +35: [2023-04-29 11:26:41,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +35: [2023-04-29 11:26:41,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +35: [2023-04-29 11:26:41,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +38: [2023-04-29 11:26:41,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +35: [2023-04-29 11:26:41,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +13: [2023-04-29 11:26:41,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +31: [2023-04-29 11:26:41,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +29: [2023-04-29 11:26:41,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +29: [2023-04-29 11:26:41,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +15: [2023-04-29 11:26:41,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +21: [2023-04-29 11:26:41,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +61: [2023-04-29 11:26:41,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +61: [2023-04-29 11:26:41,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +61: [2023-04-29 11:26:41,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +38: [2023-04-29 11:26:41,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +61: [2023-04-29 11:26:41,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +29: [2023-04-29 11:26:41,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +20: [2023-04-29 11:26:41,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +29: [2023-04-29 11:26:41,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +22: [2023-04-29 11:26:41,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +46: [2023-04-29 11:26:41,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +46: [2023-04-29 11:26:41,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +56: [2023-04-29 11:26:41,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +56: [2023-04-29 11:26:41,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +56: [2023-04-29 11:26:41,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +56: [2023-04-29 11:26:41,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +29: [2023-04-29 11:26:41,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +29: [2023-04-29 11:26:41,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +18: [2023-04-29 11:26:41,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +52: [2023-04-29 11:26:41,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +21: [2023-04-29 11:26:41,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +21: [2023-04-29 11:26:41,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +16: [2023-04-29 11:26:41,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +19: [2023-04-29 11:26:41,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +19: [2023-04-29 11:26:41,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +52: [2023-04-29 11:26:41,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +10: [2023-04-29 11:26:41,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +46: [2023-04-29 11:26:41,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +46: [2023-04-29 11:26:41,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +46: [2023-04-29 11:26:41,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +52: [2023-04-29 11:26:41,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +16: [2023-04-29 11:26:41,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +48: [2023-04-29 11:26:41,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +48: [2023-04-29 11:26:41,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +21: [2023-04-29 11:26:41,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +46: [2023-04-29 11:26:41,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +31: [2023-04-29 11:26:41,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +46: [2023-04-29 11:26:41,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +48: [2023-04-29 11:26:41,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +48: [2023-04-29 11:26:41,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +48: [2023-04-29 11:26:41,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +10: [2023-04-29 11:26:41,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +46: [2023-04-29 11:26:41,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +48: [2023-04-29 11:26:41,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +48: [2023-04-29 11:26:41,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +44: [2023-04-29 11:26:41,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +44: [2023-04-29 11:26:41,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +44: [2023-04-29 11:26:41,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +31: [2023-04-29 11:26:41,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +48: [2023-04-29 11:26:41,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +44: [2023-04-29 11:26:41,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +31: [2023-04-29 11:26:41,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +10: [2023-04-29 11:26:41,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 11:26:41,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +55: [2023-04-29 11:26:41,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +61: [2023-04-29 11:26:41,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +61: [2023-04-29 11:26:41,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +61: [2023-04-29 11:26:41,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +31: [2023-04-29 11:26:41,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +61: [2023-04-29 11:26:41,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +15: [2023-04-29 11:26:41,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +13: [2023-04-29 11:26:41,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +13: [2023-04-29 11:26:41,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +13: [2023-04-29 11:26:41,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +19: [2023-04-29 11:26:41,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +18: [2023-04-29 11:26:41,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +11: [2023-04-29 11:26:41,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 4: [2023-04-29 11:26:41,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +25: [2023-04-29 11:26:41,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +19: [2023-04-29 11:26:41,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +12: [2023-04-29 11:26:41,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +19: [2023-04-29 11:26:41,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +18: [2023-04-29 11:26:41,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +18: [2023-04-29 11:26:41,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +11: [2023-04-29 11:26:41,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +39: [2023-04-29 11:26:41,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +11: [2023-04-29 11:26:41,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +18: [2023-04-29 11:26:41,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +19: [2023-04-29 11:26:41,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +48: [2023-04-29 11:26:41,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +48: [2023-04-29 11:26:41,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +48: [2023-04-29 11:26:41,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +55: [2023-04-29 11:26:41,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +48: [2023-04-29 11:26:41,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +48: [2023-04-29 11:26:41,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +42: [2023-04-29 11:26:41,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +19: [2023-04-29 11:26:41,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +10: [2023-04-29 11:26:41,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +11: [2023-04-29 11:26:41,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +11: [2023-04-29 11:26:41,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +11: [2023-04-29 11:26:41,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +48: [2023-04-29 11:26:41,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +48: [2023-04-29 11:26:41,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +22: [2023-04-29 11:26:41,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 4: [2023-04-29 11:26:41,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +12: [2023-04-29 11:26:41,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +48: [2023-04-29 11:26:41,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +47: [2023-04-29 11:26:41,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +47: [2023-04-29 11:26:41,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +47: [2023-04-29 11:26:41,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +10: [2023-04-29 11:26:41,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +10: [2023-04-29 11:26:41,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +18: [2023-04-29 11:26:41,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +47: [2023-04-29 11:26:41,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +22: [2023-04-29 11:26:41,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +11: [2023-04-29 11:26:41,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +15: [2023-04-29 11:26:41,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +15: [2023-04-29 11:26:41,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 0: [2023-04-29 11:26:41,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +39: [2023-04-29 11:26:41,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +25: [2023-04-29 11:26:41,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +25: [2023-04-29 11:26:41,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +25: [2023-04-29 11:26:41,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +55: [2023-04-29 11:26:41,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +18: [2023-04-29 11:26:41,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +18: [2023-04-29 11:26:41,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 0: [2023-04-29 11:26:41,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +40: [2023-04-29 11:26:41,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +15: [2023-04-29 11:26:41,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +39: [2023-04-29 11:26:41,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +11: [2023-04-29 11:26:41,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +11: [2023-04-29 11:26:41,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +11: [2023-04-29 11:26:41,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +40: [2023-04-29 11:26:41,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +40: [2023-04-29 11:26:41,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +30: [2023-04-29 11:26:41,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +30: [2023-04-29 11:26:41,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +30: [2023-04-29 11:26:41,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +42: [2023-04-29 11:26:41,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +30: [2023-04-29 11:26:41,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +15: [2023-04-29 11:26:41,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +12: [2023-04-29 11:26:41,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +15: [2023-04-29 11:26:41,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +55: [2023-04-29 11:26:41,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +42: [2023-04-29 11:26:41,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +41: [2023-04-29 11:26:41,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +41: [2023-04-29 11:26:41,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +40: [2023-04-29 11:26:41,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +42: [2023-04-29 11:26:41,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +13: [2023-04-29 11:26:41,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +41: [2023-04-29 11:26:41,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +41: [2023-04-29 11:26:41,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +41: [2023-04-29 11:26:41,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +41: [2023-04-29 11:26:41,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +41: [2023-04-29 11:26:41,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +41: [2023-04-29 11:26:41,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +12: [2023-04-29 11:26:41,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +12: [2023-04-29 11:26:41,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +16: [2023-04-29 11:26:41,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +15: [2023-04-29 11:26:41,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +16: [2023-04-29 11:26:41,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +45: [2023-04-29 11:26:41,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +45: [2023-04-29 11:26:41,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +45: [2023-04-29 11:26:41,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +30: [2023-04-29 11:26:41,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +45: [2023-04-29 11:26:41,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +30: [2023-04-29 11:26:41,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +30: [2023-04-29 11:26:41,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +30: [2023-04-29 11:26:41,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +36: [2023-04-29 11:26:41,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +36: [2023-04-29 11:26:41,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +15: [2023-04-29 11:26:41,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +15: [2023-04-29 11:26:41,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +12: [2023-04-29 11:26:41,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +56: [2023-04-29 11:26:41,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +56: [2023-04-29 11:26:41,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +11: [2023-04-29 11:26:41,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +11: [2023-04-29 11:26:41,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +11: [2023-04-29 11:26:41,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +51: [2023-04-29 11:26:41,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +51: [2023-04-29 11:26:41,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +41: [2023-04-29 11:26:41,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +41: [2023-04-29 11:26:41,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +41: [2023-04-29 11:26:41,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +41: [2023-04-29 11:26:41,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +41: [2023-04-29 11:26:41,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +51: [2023-04-29 11:26:41,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +39: [2023-04-29 11:26:41,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +51: [2023-04-29 11:26:41,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +56: [2023-04-29 11:26:41,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +56: [2023-04-29 11:26:41,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +45: [2023-04-29 11:26:41,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +55: [2023-04-29 11:26:41,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +29: [2023-04-29 11:26:41,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +41: [2023-04-29 11:26:41,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +12: [2023-04-29 11:26:41,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +10: [2023-04-29 11:26:41,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +12: [2023-04-29 11:26:41,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +45: [2023-04-29 11:26:41,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +45: [2023-04-29 11:26:41,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +29: [2023-04-29 11:26:41,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +41: [2023-04-29 11:26:41,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +16: [2023-04-29 11:26:41,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +25: [2023-04-29 11:26:41,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +36: [2023-04-29 11:26:41,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +41: [2023-04-29 11:26:41,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +36: [2023-04-29 11:26:41,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +29: [2023-04-29 11:26:41,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +45: [2023-04-29 11:26:41,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +44: [2023-04-29 11:26:41,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +44: [2023-04-29 11:26:41,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +13: [2023-04-29 11:26:41,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +45: [2023-04-29 11:26:41,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +45: [2023-04-29 11:26:41,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +16: [2023-04-29 11:26:41,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +13: [2023-04-29 11:26:41,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +13: [2023-04-29 11:26:41,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +45: [2023-04-29 11:26:41,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +23: [2023-04-29 11:26:41,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +23: [2023-04-29 11:26:41,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +10: [2023-04-29 11:26:41,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +42: [2023-04-29 11:26:41,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +42: [2023-04-29 11:26:41,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +29: [2023-04-29 11:26:41,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +42: [2023-04-29 11:26:41,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +42: [2023-04-29 11:26:41,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +23: [2023-04-29 11:26:41,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +18: [2023-04-29 11:26:41,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +45: [2023-04-29 11:26:41,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +44: [2023-04-29 11:26:41,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +23: [2023-04-29 11:26:41,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +23: [2023-04-29 11:26:41,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +23: [2023-04-29 11:26:41,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +23: [2023-04-29 11:26:41,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +44: [2023-04-29 11:26:41,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +11: [2023-04-29 11:26:41,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +23: [2023-04-29 11:26:41,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +42: [2023-04-29 11:26:41,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +11: [2023-04-29 11:26:41,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +39: [2023-04-29 11:26:41,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +11: [2023-04-29 11:26:41,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +12: [2023-04-29 11:26:41,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +12: [2023-04-29 11:26:41,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +47: [2023-04-29 11:26:41,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +47: [2023-04-29 11:26:41,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +55: [2023-04-29 11:26:41,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +55: [2023-04-29 11:26:41,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +55: [2023-04-29 11:26:41,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +15: [2023-04-29 11:26:41,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +14: [2023-04-29 11:26:41,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +14: [2023-04-29 11:26:41,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +15: [2023-04-29 11:26:41,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 1: [2023-04-29 11:26:41,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 1: [2023-04-29 11:26:41,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 1: [2023-04-29 11:26:41,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +23: [2023-04-29 11:26:41,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +23: [2023-04-29 11:26:41,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +23: [2023-04-29 11:26:41,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +55: [2023-04-29 11:26:41,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +23: [2023-04-29 11:26:41,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +23: [2023-04-29 11:26:41,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +55: [2023-04-29 11:26:41,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +25: [2023-04-29 11:26:41,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +24: [2023-04-29 11:26:41,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +25: [2023-04-29 11:26:41,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +47: [2023-04-29 11:26:41,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +18: [2023-04-29 11:26:41,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +49: [2023-04-29 11:26:41,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +24: [2023-04-29 11:26:41,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +47: [2023-04-29 11:26:41,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +23: [2023-04-29 11:26:41,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +23: [2023-04-29 11:26:41,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +14: [2023-04-29 11:26:41,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +14: [2023-04-29 11:26:41,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +57: [2023-04-29 11:26:41,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +23: [2023-04-29 11:26:41,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +25: [2023-04-29 11:26:41,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 11:26:41,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +25: [2023-04-29 11:26:41,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +25: [2023-04-29 11:26:41,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +39: [2023-04-29 11:26:41,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +58: [2023-04-29 11:26:41,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 1: [2023-04-29 11:26:41,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +14: [2023-04-29 11:26:41,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +14: [2023-04-29 11:26:41,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +28: [2023-04-29 11:26:41,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +12: [2023-04-29 11:26:41,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +28: [2023-04-29 11:26:41,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +28: [2023-04-29 11:26:41,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +28: [2023-04-29 11:26:41,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +28: [2023-04-29 11:26:41,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +28: [2023-04-29 11:26:41,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 1: [2023-04-29 11:26:41,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +28: [2023-04-29 11:26:41,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +18: [2023-04-29 11:26:41,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +28: [2023-04-29 11:26:41,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +18: [2023-04-29 11:26:41,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +55: [2023-04-29 11:26:41,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +12: [2023-04-29 11:26:41,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +58: [2023-04-29 11:26:41,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +17: [2023-04-29 11:26:41,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +17: [2023-04-29 11:26:41,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +17: [2023-04-29 11:26:41,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +22: [2023-04-29 11:26:41,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +16: [2023-04-29 11:26:41,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 11:26:41,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +24: [2023-04-29 11:26:41,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +24: [2023-04-29 11:26:41,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +39: [2023-04-29 11:26:41,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +14: [2023-04-29 11:26:41,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +25: [2023-04-29 11:26:41,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +42: [2023-04-29 11:26:41,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +57: [2023-04-29 11:26:41,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +14: [2023-04-29 11:26:41,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +25: [2023-04-29 11:26:41,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +21: [2023-04-29 11:26:41,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +21: [2023-04-29 11:26:41,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +21: [2023-04-29 11:26:41,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +25: [2023-04-29 11:26:41,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +14: [2023-04-29 11:26:41,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +28: [2023-04-29 11:26:41,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +25: [2023-04-29 11:26:41,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +58: [2023-04-29 11:26:41,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +14: [2023-04-29 11:26:41,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +28: [2023-04-29 11:26:41,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +58: [2023-04-29 11:26:41,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +28: [2023-04-29 11:26:41,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +28: [2023-04-29 11:26:41,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 2: [2023-04-29 11:26:41,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +40: [2023-04-29 11:26:41,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +40: [2023-04-29 11:26:41,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +40: [2023-04-29 11:26:41,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +15: [2023-04-29 11:26:41,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +40: [2023-04-29 11:26:41,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +22: [2023-04-29 11:26:41,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +22: [2023-04-29 11:26:41,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +15: [2023-04-29 11:26:41,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +36: [2023-04-29 11:26:41,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +36: [2023-04-29 11:26:41,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 2: [2023-04-29 11:26:41,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +21: [2023-04-29 11:26:41,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 2: [2023-04-29 11:26:41,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 2: [2023-04-29 11:26:41,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +57: [2023-04-29 11:26:41,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +28: [2023-04-29 11:26:41,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +28: [2023-04-29 11:26:41,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +25: [2023-04-29 11:26:41,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +17: [2023-04-29 11:26:41,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +14: [2023-04-29 11:26:41,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +17: [2023-04-29 11:26:41,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +14: [2023-04-29 11:26:41,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +28: [2023-04-29 11:26:41,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +28: [2023-04-29 11:26:41,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +49: [2023-04-29 11:26:41,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +55: [2023-04-29 11:26:41,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +49: [2023-04-29 11:26:41,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +57: [2023-04-29 11:26:41,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +57: [2023-04-29 11:26:41,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +18: [2023-04-29 11:26:41,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +17: [2023-04-29 11:26:41,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +25: [2023-04-29 11:26:41,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +63: [2023-04-29 11:26:41,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +17: [2023-04-29 11:26:41,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +40: [2023-04-29 11:26:41,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +49: [2023-04-29 11:26:41,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +40: [2023-04-29 11:26:41,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +36: [2023-04-29 11:26:41,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +39: [2023-04-29 11:26:41,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +51: [2023-04-29 11:26:41,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +51: [2023-04-29 11:26:41,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +56: [2023-04-29 11:26:41,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +56: [2023-04-29 11:26:41,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +36: [2023-04-29 11:26:41,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +56: [2023-04-29 11:26:41,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +51: [2023-04-29 11:26:41,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +51: [2023-04-29 11:26:41,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +20: [2023-04-29 11:26:41,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +20: [2023-04-29 11:26:41,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +20: [2023-04-29 11:26:41,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +20: [2023-04-29 11:26:41,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +20: [2023-04-29 11:26:41,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +20: [2023-04-29 11:26:41,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +40: [2023-04-29 11:26:41,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +57: [2023-04-29 11:26:41,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +22: [2023-04-29 11:26:41,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +45: [2023-04-29 11:26:41,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +40: [2023-04-29 11:26:41,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +63: [2023-04-29 11:26:41,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +63: [2023-04-29 11:26:41,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +46: [2023-04-29 11:26:41,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +57: [2023-04-29 11:26:41,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... + 3: [2023-04-29 11:26:41,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 3: [2023-04-29 11:26:41,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +16: [2023-04-29 11:26:41,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 3: [2023-04-29 11:26:41,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +42: [2023-04-29 11:26:41,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +16: [2023-04-29 11:26:41,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +42: [2023-04-29 11:26:41,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +31: [2023-04-29 11:26:41,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +57: [2023-04-29 11:26:41,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +56: [2023-04-29 11:26:41,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +42: [2023-04-29 11:26:41,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +45: [2023-04-29 11:26:41,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +22: [2023-04-29 11:26:41,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +42: [2023-04-29 11:26:41,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +42: [2023-04-29 11:26:41,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +49: [2023-04-29 11:26:41,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +29: [2023-04-29 11:26:41,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +63: [2023-04-29 11:26:41,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +29: [2023-04-29 11:26:41,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +20: [2023-04-29 11:26:41,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +58: [2023-04-29 11:26:41,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +58: [2023-04-29 11:26:41,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +20: [2023-04-29 11:26:41,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +20: [2023-04-29 11:26:41,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +12: [2023-04-29 11:26:41,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +20: [2023-04-29 11:26:41,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +61: [2023-04-29 11:26:41,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +12: [2023-04-29 11:26:41,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +15: [2023-04-29 11:26:41,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +20: [2023-04-29 11:26:41,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +15: [2023-04-29 11:26:41,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +35: [2023-04-29 11:26:41,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +35: [2023-04-29 11:26:41,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +24: [2023-04-29 11:26:41,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +20: [2023-04-29 11:26:41,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +42: [2023-04-29 11:26:41,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +46: [2023-04-29 11:26:41,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +22: [2023-04-29 11:26:41,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 8: [2023-04-29 11:26:41,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +46: [2023-04-29 11:26:41,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +63: [2023-04-29 11:26:41,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +16: [2023-04-29 11:26:41,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +24: [2023-04-29 11:26:41,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +35: [2023-04-29 11:26:41,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +35: [2023-04-29 11:26:41,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +63: [2023-04-29 11:26:41,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +20: [2023-04-29 11:26:41,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +35: [2023-04-29 11:26:41,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +63: [2023-04-29 11:26:41,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... + 3: [2023-04-29 11:26:41,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 3: [2023-04-29 11:26:41,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 3: [2023-04-29 11:26:41,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 3: [2023-04-29 11:26:41,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 6: [2023-04-29 11:26:41,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +31: [2023-04-29 11:26:41,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 3: [2023-04-29 11:26:41,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +61: [2023-04-29 11:26:41,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +61: [2023-04-29 11:26:41,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +11: [2023-04-29 11:26:41,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +46: [2023-04-29 11:26:41,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +56: [2023-04-29 11:26:41,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +45: [2023-04-29 11:26:41,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +61: [2023-04-29 11:26:41,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +16: [2023-04-29 11:26:41,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +45: [2023-04-29 11:26:41,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +22: [2023-04-29 11:26:41,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +35: [2023-04-29 11:26:41,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +35: [2023-04-29 11:26:41,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +19: [2023-04-29 11:26:41,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +35: [2023-04-29 11:26:41,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +18: [2023-04-29 11:26:41,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +21: [2023-04-29 11:26:41,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 6: [2023-04-29 11:26:41,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 6: [2023-04-29 11:26:41,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +31: [2023-04-29 11:26:41,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +31: [2023-04-29 11:26:41,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +10: [2023-04-29 11:26:41,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +51: [2023-04-29 11:26:41,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +51: [2023-04-29 11:26:41,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +48: [2023-04-29 11:26:41,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +48: [2023-04-29 11:26:41,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +51: [2023-04-29 11:26:41,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +24: [2023-04-29 11:26:41,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +51: [2023-04-29 11:26:41,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +21: [2023-04-29 11:26:41,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +58: [2023-04-29 11:26:41,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +58: [2023-04-29 11:26:41,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +18: [2023-04-29 11:26:41,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +21: [2023-04-29 11:26:41,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +18: [2023-04-29 11:26:41,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +12: [2023-04-29 11:26:41,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +63: [2023-04-29 11:26:41,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +31: [2023-04-29 11:26:41,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +21: [2023-04-29 11:26:41,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +55: [2023-04-29 11:26:41,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +58: [2023-04-29 11:26:41,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +58: [2023-04-29 11:26:41,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +20: [2023-04-29 11:26:41,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +24: [2023-04-29 11:26:41,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +12: [2023-04-29 11:26:41,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +58: [2023-04-29 11:26:41,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +19: [2023-04-29 11:26:41,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +20: [2023-04-29 11:26:41,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +14: [2023-04-29 11:26:41,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +14: [2023-04-29 11:26:41,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +35: [2023-04-29 11:26:41,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +35: [2023-04-29 11:26:41,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +55: [2023-04-29 11:26:41,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +19: [2023-04-29 11:26:41,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +21: [2023-04-29 11:26:41,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +10: [2023-04-29 11:26:41,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +21: [2023-04-29 11:26:41,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +58: [2023-04-29 11:26:41,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +21: [2023-04-29 11:26:41,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +31: [2023-04-29 11:26:41,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +35: [2023-04-29 11:26:41,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +51: [2023-04-29 11:26:41,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +51: [2023-04-29 11:26:41,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +51: [2023-04-29 11:26:41,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +51: [2023-04-29 11:26:41,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 5: [2023-04-29 11:26:41,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 5: [2023-04-29 11:26:41,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +56: [2023-04-29 11:26:41,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +56: [2023-04-29 11:26:41,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +21: [2023-04-29 11:26:41,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +31: [2023-04-29 11:26:41,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 1: [2023-04-29 11:26:41,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 1: [2023-04-29 11:26:41,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +35: [2023-04-29 11:26:41,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +35: [2023-04-29 11:26:41,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +35: [2023-04-29 11:26:41,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... + 1: [2023-04-29 11:26:41,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +21: [2023-04-29 11:26:41,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +31: [2023-04-29 11:26:41,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +35: [2023-04-29 11:26:41,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +21: [2023-04-29 11:26:41,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 1: [2023-04-29 11:26:41,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +35: [2023-04-29 11:26:41,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +55: [2023-04-29 11:26:41,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +58: [2023-04-29 11:26:41,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 4: [2023-04-29 11:26:41,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 4: [2023-04-29 11:26:41,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 4: [2023-04-29 11:26:41,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 4: [2023-04-29 11:26:41,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +19: [2023-04-29 11:26:41,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +13: [2023-04-29 11:26:41,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +13: [2023-04-29 11:26:41,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +48: [2023-04-29 11:26:41,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +48: [2023-04-29 11:26:41,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +58: [2023-04-29 11:26:41,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +13: [2023-04-29 11:26:41,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +14: [2023-04-29 11:26:41,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +21: [2023-04-29 11:26:41,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +29: [2023-04-29 11:26:41,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +58: [2023-04-29 11:26:41,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +20: [2023-04-29 11:26:41,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +21: [2023-04-29 11:26:41,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +13: [2023-04-29 11:26:41,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 5: [2023-04-29 11:26:41,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +29: [2023-04-29 11:26:41,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +26: [2023-04-29 11:26:41,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +26: [2023-04-29 11:26:41,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +58: [2023-04-29 11:26:41,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +14: [2023-04-29 11:26:41,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +26: [2023-04-29 11:26:41,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +49: [2023-04-29 11:26:41,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +26: [2023-04-29 11:26:41,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +49: [2023-04-29 11:26:41,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +56: [2023-04-29 11:26:41,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 11:26:41,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +46: [2023-04-29 11:26:41,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +29: [2023-04-29 11:26:41,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +29: [2023-04-29 11:26:41,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +30: [2023-04-29 11:26:41,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +11: [2023-04-29 11:26:41,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +11: [2023-04-29 11:26:41,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +26: [2023-04-29 11:26:41,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +26: [2023-04-29 11:26:41,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +26: [2023-04-29 11:26:41,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +17: [2023-04-29 11:26:41,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +17: [2023-04-29 11:26:41,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +11: [2023-04-29 11:26:41,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +10: [2023-04-29 11:26:41,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +61: [2023-04-29 11:26:41,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +11: [2023-04-29 11:26:41,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +26: [2023-04-29 11:26:41,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +55: [2023-04-29 11:26:41,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +41: [2023-04-29 11:26:41,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +41: [2023-04-29 11:26:41,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +30: [2023-04-29 11:26:41,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +30: [2023-04-29 11:26:41,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +30: [2023-04-29 11:26:41,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +53: [2023-04-29 11:26:41,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +53: [2023-04-29 11:26:41,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +16: [2023-04-29 11:26:41,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +46: [2023-04-29 11:26:41,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +40: [2023-04-29 11:26:41,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +40: [2023-04-29 11:26:41,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +40: [2023-04-29 11:26:41,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +41: [2023-04-29 11:26:41,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +41: [2023-04-29 11:26:41,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +46: [2023-04-29 11:26:41,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +17: [2023-04-29 11:26:41,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +10: [2023-04-29 11:26:41,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +10: [2023-04-29 11:26:41,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +17: [2023-04-29 11:26:41,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +19: [2023-04-29 11:26:41,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +48: [2023-04-29 11:26:41,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +48: [2023-04-29 11:26:41,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +44: [2023-04-29 11:26:41,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 8: [2023-04-29 11:26:41,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +44: [2023-04-29 11:26:41,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +40: [2023-04-29 11:26:41,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +61: [2023-04-29 11:26:41,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +61: [2023-04-29 11:26:41,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +10: [2023-04-29 11:26:41,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +46: [2023-04-29 11:26:41,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +61: [2023-04-29 11:26:41,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 8: [2023-04-29 11:26:41,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +19: [2023-04-29 11:26:41,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +23: [2023-04-29 11:26:41,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +40: [2023-04-29 11:26:41,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +40: [2023-04-29 11:26:41,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +40: [2023-04-29 11:26:41,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +45: [2023-04-29 11:26:41,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +29: [2023-04-29 11:26:41,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +44: [2023-04-29 11:26:41,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +10: [2023-04-29 11:26:41,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +44: [2023-04-29 11:26:41,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +44: [2023-04-29 11:26:41,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +10: [2023-04-29 11:26:41,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +44: [2023-04-29 11:26:41,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +47: [2023-04-29 11:26:41,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +47: [2023-04-29 11:26:41,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +40: [2023-04-29 11:26:41,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +29: [2023-04-29 11:26:41,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +53: [2023-04-29 11:26:41,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +56: [2023-04-29 11:26:41,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +53: [2023-04-29 11:26:41,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +53: [2023-04-29 11:26:41,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +53: [2023-04-29 11:26:41,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +53: [2023-04-29 11:26:41,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +16: [2023-04-29 11:26:41,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +53: [2023-04-29 11:26:41,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +19: [2023-04-29 11:26:41,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +16: [2023-04-29 11:26:41,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +47: [2023-04-29 11:26:41,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +44: [2023-04-29 11:26:41,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +45: [2023-04-29 11:26:41,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +56: [2023-04-29 11:26:41,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +56: [2023-04-29 11:26:41,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +23: [2023-04-29 11:26:41,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +23: [2023-04-29 11:26:41,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +16: [2023-04-29 11:26:41,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +16: [2023-04-29 11:26:41,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +47: [2023-04-29 11:26:41,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 4: [2023-04-29 11:26:41,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 4: [2023-04-29 11:26:41,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +29: [2023-04-29 11:26:41,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 3: [2023-04-29 11:26:41,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +44: [2023-04-29 11:26:41,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +48: [2023-04-29 11:26:41,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +19: [2023-04-29 11:26:41,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +28: [2023-04-29 11:26:41,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +13: [2023-04-29 11:26:41,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 4: [2023-04-29 11:26:41,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +47: [2023-04-29 11:26:41,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +47: [2023-04-29 11:26:41,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +47: [2023-04-29 11:26:41,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... + 1: [2023-04-29 11:26:41,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +48: [2023-04-29 11:26:41,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +29: [2023-04-29 11:26:41,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +29: [2023-04-29 11:26:41,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +29: [2023-04-29 11:26:41,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 4: [2023-04-29 11:26:41,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +13: [2023-04-29 11:26:41,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +13: [2023-04-29 11:26:41,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +13: [2023-04-29 11:26:41,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +16: [2023-04-29 11:26:41,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +16: [2023-04-29 11:26:41,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +47: [2023-04-29 11:26:41,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +28: [2023-04-29 11:26:41,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +16: [2023-04-29 11:26:41,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +16: [2023-04-29 11:26:41,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +51: [2023-04-29 11:26:41,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +51: [2023-04-29 11:26:41,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +56: [2023-04-29 11:26:41,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +23: [2023-04-29 11:26:41,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +29: [2023-04-29 11:26:41,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +30: [2023-04-29 11:26:41,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +41: [2023-04-29 11:26:41,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +11: [2023-04-29 11:26:41,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +40: [2023-04-29 11:26:41,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +41: [2023-04-29 11:26:41,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +11: [2023-04-29 11:26:41,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +16: [2023-04-29 11:26:41,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +51: [2023-04-29 11:26:41,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +51: [2023-04-29 11:26:41,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +11: [2023-04-29 11:26:41,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +36: [2023-04-29 11:26:41,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +36: [2023-04-29 11:26:41,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +51: [2023-04-29 11:26:41,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +51: [2023-04-29 11:26:41,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +45: [2023-04-29 11:26:41,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +30: [2023-04-29 11:26:41,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +41: [2023-04-29 11:26:41,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +41: [2023-04-29 11:26:41,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +16: [2023-04-29 11:26:41,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +45: [2023-04-29 11:26:41,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +30: [2023-04-29 11:26:41,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +29: [2023-04-29 11:26:41,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +49: [2023-04-29 11:26:41,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +49: [2023-04-29 11:26:41,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +23: [2023-04-29 11:26:41,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +51: [2023-04-29 11:26:41,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +20: [2023-04-29 11:26:41,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +51: [2023-04-29 11:26:41,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +36: [2023-04-29 11:26:41,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +36: [2023-04-29 11:26:41,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +49: [2023-04-29 11:26:41,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +30: [2023-04-29 11:26:41,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 1: [2023-04-29 11:26:41,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 1: [2023-04-29 11:26:41,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 1: [2023-04-29 11:26:41,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +20: [2023-04-29 11:26:41,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +36: [2023-04-29 11:26:41,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +29: [2023-04-29 11:26:41,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +45: [2023-04-29 11:26:41,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +49: [2023-04-29 11:26:41,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_25-model_01-model_states.pt. +36: [2023-04-29 11:26:41,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +17: [2023-04-29 11:26:41,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +17: [2023-04-29 11:26:41,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +28: [2023-04-29 11:26:41,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +28: [2023-04-29 11:26:41,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +17: [2023-04-29 11:26:41,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +36: [2023-04-29 11:26:41,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +40: [2023-04-29 11:26:41,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +40: [2023-04-29 11:26:41,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +20: [2023-04-29 11:26:41,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +36: [2023-04-29 11:26:41,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +20: [2023-04-29 11:26:41,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +17: [2023-04-29 11:26:41,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +17: [2023-04-29 11:26:41,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +42: [2023-04-29 11:26:41,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +42: [2023-04-29 11:26:41,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +42: [2023-04-29 11:26:41,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +32: [2023-04-29 11:26:41,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +32: [2023-04-29 11:26:41,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +32: [2023-04-29 11:26:41,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +29: [2023-04-29 11:26:41,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +32: [2023-04-29 11:26:41,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +27: [2023-04-29 11:26:41,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 11:26:41,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +28: [2023-04-29 11:26:41,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +40: [2023-04-29 11:26:41,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +42: [2023-04-29 11:26:41,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +17: [2023-04-29 11:26:41,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +27: [2023-04-29 11:26:41,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 11:26:41,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +45: [2023-04-29 11:26:41,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +23: [2023-04-29 11:26:41,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +56: [2023-04-29 11:26:41,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +23: [2023-04-29 11:26:41,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +45: [2023-04-29 11:26:41,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +17: [2023-04-29 11:26:41,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +14: [2023-04-29 11:26:41,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +42: [2023-04-29 11:26:41,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +42: [2023-04-29 11:26:41,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +42: [2023-04-29 11:26:41,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +28: [2023-04-29 11:26:41,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +42: [2023-04-29 11:26:41,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +14: [2023-04-29 11:26:41,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +14: [2023-04-29 11:26:41,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +56: [2023-04-29 11:26:41,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +56: [2023-04-29 11:26:41,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 11:26:41,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +27: [2023-04-29 11:26:41,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +56: [2023-04-29 11:26:41,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +27: [2023-04-29 11:26:41,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +45: [2023-04-29 11:26:41,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +32: [2023-04-29 11:26:41,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +17: [2023-04-29 11:26:41,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +32: [2023-04-29 11:26:41,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +27: [2023-04-29 11:26:41,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +32: [2023-04-29 11:26:41,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +32: [2023-04-29 11:26:41,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +14: [2023-04-29 11:26:41,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +14: [2023-04-29 11:26:41,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +56: [2023-04-29 11:26:41,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +27: [2023-04-29 11:26:41,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +27: [2023-04-29 11:26:41,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. + 3: [2023-04-29 11:26:41,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +40: [2023-04-29 11:26:41,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +35: [2023-04-29 11:26:41,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 1: [2023-04-29 11:26:41,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +45: [2023-04-29 11:26:41,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +51: [2023-04-29 11:26:41,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +51: [2023-04-29 11:26:41,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +27: [2023-04-29 11:26:41,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +51: [2023-04-29 11:26:41,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +27: [2023-04-29 11:26:41,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_03-model_01-model_states.pt. +23: [2023-04-29 11:26:41,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +35: [2023-04-29 11:26:41,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +56: [2023-04-29 11:26:41,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +56: [2023-04-29 11:26:41,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +14: [2023-04-29 11:26:41,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +45: [2023-04-29 11:26:41,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +14: [2023-04-29 11:26:41,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +14: [2023-04-29 11:26:41,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +14: [2023-04-29 11:26:41,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +55: [2023-04-29 11:26:41,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 11:26:41,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +49: [2023-04-29 11:26:41,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +35: [2023-04-29 11:26:41,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 11:26:41,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... + 5: [2023-04-29 11:26:41,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +55: [2023-04-29 11:26:41,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 5: [2023-04-29 11:26:41,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +56: [2023-04-29 11:26:41,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... + 3: [2023-04-29 11:26:41,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +51: [2023-04-29 11:26:41,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +20: [2023-04-29 11:26:41,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +45: [2023-04-29 11:26:41,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +20: [2023-04-29 11:26:41,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 3: [2023-04-29 11:26:41,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +55: [2023-04-29 11:26:41,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. + 1: [2023-04-29 11:26:41,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +14: [2023-04-29 11:26:41,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +49: [2023-04-29 11:26:41,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt... +35: [2023-04-29 11:26:41,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +53: [2023-04-29 11:26:41,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +53: [2023-04-29 11:26:41,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +28: [2023-04-29 11:26:41,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +28: [2023-04-29 11:26:42,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +26: [2023-04-29 11:26:42,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +26: [2023-04-29 11:26:42,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +26: [2023-04-29 11:26:42,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +45: [2023-04-29 11:26:42,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +55: [2023-04-29 11:26:42,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +55: [2023-04-29 11:26:42,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +26: [2023-04-29 11:26:42,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +45: [2023-04-29 11:26:42,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +55: [2023-04-29 11:26:42,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +45: [2023-04-29 11:26:42,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +40: [2023-04-29 11:26:42,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 3: [2023-04-29 11:26:42,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 11:26:42,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +20: [2023-04-29 11:26:42,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +55: [2023-04-29 11:26:42,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +17: [2023-04-29 11:26:42,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +20: [2023-04-29 11:26:42,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +45: [2023-04-29 11:26:42,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +53: [2023-04-29 11:26:42,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 5: [2023-04-29 11:26:42,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +40: [2023-04-29 11:26:42,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +40: [2023-04-29 11:26:42,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 5: [2023-04-29 11:26:42,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +53: [2023-04-29 11:26:42,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +45: [2023-04-29 11:26:42,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... + 3: [2023-04-29 11:26:42,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +17: [2023-04-29 11:26:42,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +55: [2023-04-29 11:26:42,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +54: [2023-04-29 11:26:42,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +54: [2023-04-29 11:26:42,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +54: [2023-04-29 11:26:42,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +54: [2023-04-29 11:26:42,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +51: [2023-04-29 11:26:42,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 4: [2023-04-29 11:26:42,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 4: [2023-04-29 11:26:42,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +51: [2023-04-29 11:26:42,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +51: [2023-04-29 11:26:42,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +14: [2023-04-29 11:26:42,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +35: [2023-04-29 11:26:42,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +27: [2023-04-29 11:26:42,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +35: [2023-04-29 11:26:42,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +27: [2023-04-29 11:26:42,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +54: [2023-04-29 11:26:42,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +51: [2023-04-29 11:26:42,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 11:26:42,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 4: [2023-04-29 11:26:42,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 4: [2023-04-29 11:26:42,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +14: [2023-04-29 11:26:42,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 3: [2023-04-29 11:26:42,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +27: [2023-04-29 11:26:42,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +27: [2023-04-29 11:26:42,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt... +35: [2023-04-29 11:26:42,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +54: [2023-04-29 11:26:42,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +54: [2023-04-29 11:26:42,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 4: [2023-04-29 11:26:42,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 4: [2023-04-29 11:26:42,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 3: [2023-04-29 11:26:42,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 11:26:42,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 5: [2023-04-29 11:26:42,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 7: [2023-04-29 11:26:42,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 5: [2023-04-29 11:26:42,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +53: [2023-04-29 11:26:42,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +53: [2023-04-29 11:26:42,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +14: [2023-04-29 11:26:42,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +32: [2023-04-29 11:26:42,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +32: [2023-04-29 11:26:42,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +32: [2023-04-29 11:26:42,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +14: [2023-04-29 11:26:42,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +32: [2023-04-29 11:26:42,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +26: [2023-04-29 11:26:42,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 4: [2023-04-29 11:26:42,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 4: [2023-04-29 11:26:42,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 1: [2023-04-29 11:26:42,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +14: [2023-04-29 11:26:42,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 3: [2023-04-29 11:26:42,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 1: [2023-04-29 11:26:42,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +26: [2023-04-29 11:26:42,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +13: [2023-04-29 11:26:42,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +13: [2023-04-29 11:26:42,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +13: [2023-04-29 11:26:42,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +26: [2023-04-29 11:26:42,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +26: [2023-04-29 11:26:42,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 7: [2023-04-29 11:26:42,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 7: [2023-04-29 11:26:42,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 3: [2023-04-29 11:26:42,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 7: [2023-04-29 11:26:42,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +35: [2023-04-29 11:26:42,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +14: [2023-04-29 11:26:42,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 3: [2023-04-29 11:26:42,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 1: [2023-04-29 11:26:42,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +53: [2023-04-29 11:26:42,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 3: [2023-04-29 11:26:42,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +53: [2023-04-29 11:26:42,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 3: [2023-04-29 11:26:42,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 3: [2023-04-29 11:26:42,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 3: [2023-04-29 11:26:42,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +17: [2023-04-29 11:26:42,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +17: [2023-04-29 11:26:42,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 3: [2023-04-29 11:26:42,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 3: [2023-04-29 11:26:42,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +27: [2023-04-29 11:26:42,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +32: [2023-04-29 11:26:42,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +17: [2023-04-29 11:26:42,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +27: [2023-04-29 11:26:42,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 11:26:42,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 11:26:42,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +17: [2023-04-29 11:26:42,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +49: [2023-04-29 11:26:42,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 11:26:42,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 11:26:42,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +34: [2023-04-29 11:26:42,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +34: [2023-04-29 11:26:42,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +49: [2023-04-29 11:26:42,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +49: [2023-04-29 11:26:42,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +17: [2023-04-29 11:26:42,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +34: [2023-04-29 11:26:42,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +34: [2023-04-29 11:26:42,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +49: [2023-04-29 11:26:42,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_00-model_states.pt. +49: [2023-04-29 11:26:42,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +27: [2023-04-29 11:26:42,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +32: [2023-04-29 11:26:42,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 2: [2023-04-29 11:26:42,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 11:26:42,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +49: [2023-04-29 11:26:42,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt... +32: [2023-04-29 11:26:42,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 2: [2023-04-29 11:26:42,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +13: [2023-04-29 11:26:42,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +13: [2023-04-29 11:26:42,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +13: [2023-04-29 11:26:42,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +38: [2023-04-29 11:26:42,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +38: [2023-04-29 11:26:42,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +13: [2023-04-29 11:26:42,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +13: [2023-04-29 11:26:42,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +38: [2023-04-29 11:26:42,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +38: [2023-04-29 11:26:42,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +54: [2023-04-29 11:26:42,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +32: [2023-04-29 11:26:42,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +38: [2023-04-29 11:26:42,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +38: [2023-04-29 11:26:42,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +38: [2023-04-29 11:26:42,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +17: [2023-04-29 11:26:42,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +38: [2023-04-29 11:26:42,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +27: [2023-04-29 11:26:42,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +62: [2023-04-29 11:26:42,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +62: [2023-04-29 11:26:42,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 11:26:42,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 11:26:42,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 11:26:42,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 11:26:42,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +62: [2023-04-29 11:26:42,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +62: [2023-04-29 11:26:42,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +27: [2023-04-29 11:26:42,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +54: [2023-04-29 11:26:42,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +34: [2023-04-29 11:26:42,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 11:26:42,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +27: [2023-04-29 11:26:42,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +60: [2023-04-29 11:26:42,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +62: [2023-04-29 11:26:42,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +62: [2023-04-29 11:26:42,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +62: [2023-04-29 11:26:42,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +60: [2023-04-29 11:26:42,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +62: [2023-04-29 11:26:42,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +60: [2023-04-29 11:26:42,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 11:26:42,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +27: [2023-04-29 11:26:42,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +60: [2023-04-29 11:26:42,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +54: [2023-04-29 11:26:42,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +54: [2023-04-29 11:26:42,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 11:26:42,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +32: [2023-04-29 11:26:42,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +32: [2023-04-29 11:26:42,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +32: [2023-04-29 11:26:42,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +32: [2023-04-29 11:26:42,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +34: [2023-04-29 11:26:42,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +27: [2023-04-29 11:26:42,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +54: [2023-04-29 11:26:42,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +27: [2023-04-29 11:26:42,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 7: [2023-04-29 11:26:42,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 11:26:42,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... + 7: [2023-04-29 11:26:42,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 11:26:42,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. +27: [2023-04-29 11:26:42,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +43: [2023-04-29 11:26:42,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +43: [2023-04-29 11:26:42,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +43: [2023-04-29 11:26:42,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +43: [2023-04-29 11:26:42,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +61: [2023-04-29 11:26:42,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +61: [2023-04-29 11:26:42,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +53: [2023-04-29 11:26:42,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +53: [2023-04-29 11:26:42,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +61: [2023-04-29 11:26:42,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +53: [2023-04-29 11:26:42,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +53: [2023-04-29 11:26:42,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +61: [2023-04-29 11:26:42,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +43: [2023-04-29 11:26:42,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +43: [2023-04-29 11:26:42,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +43: [2023-04-29 11:26:42,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +27: [2023-04-29 11:26:42,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +27: [2023-04-29 11:26:42,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt... +43: [2023-04-29 11:26:42,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 11:26:42,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +33: [2023-04-29 11:26:42,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +33: [2023-04-29 11:26:42,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +33: [2023-04-29 11:26:42,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +22: [2023-04-29 11:26:42,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +22: [2023-04-29 11:26:42,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +60: [2023-04-29 11:26:42,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +60: [2023-04-29 11:26:42,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +22: [2023-04-29 11:26:42,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +22: [2023-04-29 11:26:42,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +32: [2023-04-29 11:26:42,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +62: [2023-04-29 11:26:42,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +62: [2023-04-29 11:26:42,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +60: [2023-04-29 11:26:42,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +60: [2023-04-29 11:26:42,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. + 7: [2023-04-29 11:26:42,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +54: [2023-04-29 11:26:42,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +22: [2023-04-29 11:26:42,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +36: [2023-04-29 11:26:42,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 11:26:42,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 11:26:42,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 11:26:42,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 11:26:42,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +50: [2023-04-29 11:26:42,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +50: [2023-04-29 11:26:42,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +50: [2023-04-29 11:26:42,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +32: [2023-04-29 11:26:42,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +22: [2023-04-29 11:26:42,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +62: [2023-04-29 11:26:42,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +62: [2023-04-29 11:26:42,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +22: [2023-04-29 11:26:42,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +54: [2023-04-29 11:26:42,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +59: [2023-04-29 11:26:42,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +59: [2023-04-29 11:26:42,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +54: [2023-04-29 11:26:42,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +59: [2023-04-29 11:26:42,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +59: [2023-04-29 11:26:42,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +22: [2023-04-29 11:26:42,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +52: [2023-04-29 11:26:42,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +52: [2023-04-29 11:26:42,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +36: [2023-04-29 11:26:42,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +36: [2023-04-29 11:26:42,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +36: [2023-04-29 11:26:42,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +36: [2023-04-29 11:26:42,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +52: [2023-04-29 11:26:42,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +52: [2023-04-29 11:26:42,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +53: [2023-04-29 11:26:42,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +61: [2023-04-29 11:26:42,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 2: [2023-04-29 11:26:42,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +32: [2023-04-29 11:26:42,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +32: [2023-04-29 11:26:42,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 7: [2023-04-29 11:26:42,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +32: [2023-04-29 11:26:42,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 2: [2023-04-29 11:26:42,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +61: [2023-04-29 11:26:42,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +53: [2023-04-29 11:26:42,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +61: [2023-04-29 11:26:42,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +53: [2023-04-29 11:26:42,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +53: [2023-04-29 11:26:42,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +61: [2023-04-29 11:26:42,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 7: [2023-04-29 11:26:42,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +32: [2023-04-29 11:26:42,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 2: [2023-04-29 11:26:42,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +38: [2023-04-29 11:26:42,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +38: [2023-04-29 11:26:42,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +13: [2023-04-29 11:26:42,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +13: [2023-04-29 11:26:42,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +33: [2023-04-29 11:26:42,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +60: [2023-04-29 11:26:42,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +13: [2023-04-29 11:26:42,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +13: [2023-04-29 11:26:42,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +31: [2023-04-29 11:26:42,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +31: [2023-04-29 11:26:42,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +31: [2023-04-29 11:26:42,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +60: [2023-04-29 11:26:42,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +31: [2023-04-29 11:26:42,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +33: [2023-04-29 11:26:42,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 11:26:42,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 11:26:42,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 0: [2023-04-29 11:26:42,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +38: [2023-04-29 11:26:42,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 11:26:42,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +13: [2023-04-29 11:26:42,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +62: [2023-04-29 11:26:42,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +10: [2023-04-29 11:26:42,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +62: [2023-04-29 11:26:42,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +13: [2023-04-29 11:26:42,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +13: [2023-04-29 11:26:42,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +10: [2023-04-29 11:26:42,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +10: [2023-04-29 11:26:42,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +13: [2023-04-29 11:26:42,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 0: [2023-04-29 11:26:42,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +10: [2023-04-29 11:26:42,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 0: [2023-04-29 11:26:42,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +31: [2023-04-29 11:26:42,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +25: [2023-04-29 11:26:42,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +25: [2023-04-29 11:26:42,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +31: [2023-04-29 11:26:42,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +31: [2023-04-29 11:26:42,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +31: [2023-04-29 11:26:42,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +60: [2023-04-29 11:26:42,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +62: [2023-04-29 11:26:42,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +59: [2023-04-29 11:26:42,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +59: [2023-04-29 11:26:42,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +54: [2023-04-29 11:26:42,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +54: [2023-04-29 11:26:42,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +54: [2023-04-29 11:26:42,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +62: [2023-04-29 11:26:42,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +38: [2023-04-29 11:26:42,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +54: [2023-04-29 11:26:42,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +59: [2023-04-29 11:26:42,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +25: [2023-04-29 11:26:42,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +25: [2023-04-29 11:26:42,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +10: [2023-04-29 11:26:42,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +59: [2023-04-29 11:26:42,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +10: [2023-04-29 11:26:42,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +52: [2023-04-29 11:26:42,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +10: [2023-04-29 11:26:42,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +25: [2023-04-29 11:26:42,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +50: [2023-04-29 11:26:42,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +25: [2023-04-29 11:26:42,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +10: [2023-04-29 11:26:42,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +60: [2023-04-29 11:26:42,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 11:26:42,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +52: [2023-04-29 11:26:42,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +52: [2023-04-29 11:26:42,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +25: [2023-04-29 11:26:42,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +25: [2023-04-29 11:26:42,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +50: [2023-04-29 11:26:42,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 2: [2023-04-29 11:26:42,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +50: [2023-04-29 11:26:42,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +60: [2023-04-29 11:26:42,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +43: [2023-04-29 11:26:42,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +33: [2023-04-29 11:26:42,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 11:26:42,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +32: [2023-04-29 11:26:42,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +62: [2023-04-29 11:26:42,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +32: [2023-04-29 11:26:42,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +33: [2023-04-29 11:26:42,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +38: [2023-04-29 11:26:42,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +38: [2023-04-29 11:26:42,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +33: [2023-04-29 11:26:42,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 2: [2023-04-29 11:26:42,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +62: [2023-04-29 11:26:42,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +62: [2023-04-29 11:26:42,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +38: [2023-04-29 11:26:42,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +62: [2023-04-29 11:26:42,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +32: [2023-04-29 11:26:42,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +32: [2023-04-29 11:26:42,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +33: [2023-04-29 11:26:42,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +33: [2023-04-29 11:26:42,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 11:26:42,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +32: [2023-04-29 11:26:42,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +43: [2023-04-29 11:26:42,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +15: [2023-04-29 11:26:42,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +15: [2023-04-29 11:26:42,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +15: [2023-04-29 11:26:42,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +54: [2023-04-29 11:26:42,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +54: [2023-04-29 11:26:42,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +54: [2023-04-29 11:26:42,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +54: [2023-04-29 11:26:42,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 11:26:42,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +38: [2023-04-29 11:26:42,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 11:26:42,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 11:26:42,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +15: [2023-04-29 11:26:42,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +33: [2023-04-29 11:26:42,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 11:26:42,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +63: [2023-04-29 11:26:42,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +63: [2023-04-29 11:26:42,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +43: [2023-04-29 11:26:42,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +63: [2023-04-29 11:26:42,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 11:26:42,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +32: [2023-04-29 11:26:42,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +18: [2023-04-29 11:26:42,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +18: [2023-04-29 11:26:42,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +15: [2023-04-29 11:26:42,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +18: [2023-04-29 11:26:42,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +15: [2023-04-29 11:26:42,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +18: [2023-04-29 11:26:42,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +15: [2023-04-29 11:26:42,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +22: [2023-04-29 11:26:42,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +43: [2023-04-29 11:26:42,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +15: [2023-04-29 11:26:42,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +63: [2023-04-29 11:26:42,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 11:26:42,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 11:26:42,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 11:26:42,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +18: [2023-04-29 11:26:42,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +18: [2023-04-29 11:26:42,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +18: [2023-04-29 11:26:42,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +18: [2023-04-29 11:26:42,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +36: [2023-04-29 11:26:42,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 11:26:42,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 11:26:42,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +43: [2023-04-29 11:26:42,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 11:26:42,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +61: [2023-04-29 11:26:42,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 11:26:42,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +53: [2023-04-29 11:26:42,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +53: [2023-04-29 11:26:42,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +62: [2023-04-29 11:26:42,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +61: [2023-04-29 11:26:42,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +22: [2023-04-29 11:26:42,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +22: [2023-04-29 11:26:42,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +43: [2023-04-29 11:26:42,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +43: [2023-04-29 11:26:42,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +43: [2023-04-29 11:26:42,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +53: [2023-04-29 11:26:42,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +53: [2023-04-29 11:26:42,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +22: [2023-04-29 11:26:42,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +62: [2023-04-29 11:26:42,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +62: [2023-04-29 11:26:42,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +43: [2023-04-29 11:26:42,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +62: [2023-04-29 11:26:42,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 6: [2023-04-29 11:26:42,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +43: [2023-04-29 11:26:42,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +53: [2023-04-29 11:26:42,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +61: [2023-04-29 11:26:42,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 6: [2023-04-29 11:26:42,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 6: [2023-04-29 11:26:42,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 6: [2023-04-29 11:26:42,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +53: [2023-04-29 11:26:42,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +61: [2023-04-29 11:26:42,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +61: [2023-04-29 11:26:42,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +61: [2023-04-29 11:26:42,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +47: [2023-04-29 11:26:42,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +47: [2023-04-29 11:26:42,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +13: [2023-04-29 11:26:42,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +53: [2023-04-29 11:26:42,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +33: [2023-04-29 11:26:42,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +33: [2023-04-29 11:26:42,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +22: [2023-04-29 11:26:42,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +43: [2023-04-29 11:26:42,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +47: [2023-04-29 11:26:42,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +47: [2023-04-29 11:26:42,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 11:26:42,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 11:26:42,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +60: [2023-04-29 11:26:42,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 11:26:42,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +53: [2023-04-29 11:26:42,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +61: [2023-04-29 11:26:42,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +61: [2023-04-29 11:26:42,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +47: [2023-04-29 11:26:42,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +43: [2023-04-29 11:26:42,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +47: [2023-04-29 11:26:42,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 11:26:42,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +33: [2023-04-29 11:26:42,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +60: [2023-04-29 11:26:42,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 11:26:42,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +60: [2023-04-29 11:26:42,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +12: [2023-04-29 11:26:42,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +12: [2023-04-29 11:26:42,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +12: [2023-04-29 11:26:42,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +12: [2023-04-29 11:26:42,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +47: [2023-04-29 11:26:42,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +10: [2023-04-29 11:26:42,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +46: [2023-04-29 11:26:42,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +46: [2023-04-29 11:26:42,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +46: [2023-04-29 11:26:42,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +13: [2023-04-29 11:26:42,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +13: [2023-04-29 11:26:42,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +46: [2023-04-29 11:26:42,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +31: [2023-04-29 11:26:42,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +60: [2023-04-29 11:26:42,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +13: [2023-04-29 11:26:42,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +47: [2023-04-29 11:26:42,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 11:26:42,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +10: [2023-04-29 11:26:42,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +33: [2023-04-29 11:26:42,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +62: [2023-04-29 11:26:42,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +12: [2023-04-29 11:26:42,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +25: [2023-04-29 11:26:42,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +25: [2023-04-29 11:26:42,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +12: [2023-04-29 11:26:42,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +12: [2023-04-29 11:26:42,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +12: [2023-04-29 11:26:42,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 0: [2023-04-29 11:26:42,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +36: [2023-04-29 11:26:42,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +36: [2023-04-29 11:26:42,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +36: [2023-04-29 11:26:42,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +37: [2023-04-29 11:26:42,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +37: [2023-04-29 11:26:42,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +62: [2023-04-29 11:26:42,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +33: [2023-04-29 11:26:42,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +31: [2023-04-29 11:26:42,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +31: [2023-04-29 11:26:42,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +31: [2023-04-29 11:26:42,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +36: [2023-04-29 11:26:42,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 0: [2023-04-29 11:26:42,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +62: [2023-04-29 11:26:42,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +62: [2023-04-29 11:26:42,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +43: [2023-04-29 11:26:42,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 11:26:42,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +33: [2023-04-29 11:26:42,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +37: [2023-04-29 11:26:42,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +25: [2023-04-29 11:26:42,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +37: [2023-04-29 11:26:42,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +10: [2023-04-29 11:26:42,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +43: [2023-04-29 11:26:42,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +10: [2023-04-29 11:26:42,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +43: [2023-04-29 11:26:42,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +62: [2023-04-29 11:26:42,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +25: [2023-04-29 11:26:42,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +62: [2023-04-29 11:26:42,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +43: [2023-04-29 11:26:42,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +62: [2023-04-29 11:26:42,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +62: [2023-04-29 11:26:42,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +22: [2023-04-29 11:26:42,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +22: [2023-04-29 11:26:42,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +13: [2023-04-29 11:26:42,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +54: [2023-04-29 11:26:42,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +22: [2023-04-29 11:26:42,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +48: [2023-04-29 11:26:42,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +48: [2023-04-29 11:26:42,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +60: [2023-04-29 11:26:42,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +54: [2023-04-29 11:26:42,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +48: [2023-04-29 11:26:42,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. + 0: [2023-04-29 11:26:42,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +48: [2023-04-29 11:26:42,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +26: [2023-04-29 11:26:42,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +26: [2023-04-29 11:26:42,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +54: [2023-04-29 11:26:42,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +33: [2023-04-29 11:26:42,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 11:26:42,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +26: [2023-04-29 11:26:42,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +10: [2023-04-29 11:26:42,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +26: [2023-04-29 11:26:42,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +54: [2023-04-29 11:26:42,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +54: [2023-04-29 11:26:42,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +33: [2023-04-29 11:26:42,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +13: [2023-04-29 11:26:42,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +46: [2023-04-29 11:26:42,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +10: [2023-04-29 11:26:42,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +31: [2023-04-29 11:26:42,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +13: [2023-04-29 11:26:42,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +63: [2023-04-29 11:26:42,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +13: [2023-04-29 11:26:42,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +15: [2023-04-29 11:26:42,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +15: [2023-04-29 11:26:42,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +54: [2023-04-29 11:26:42,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +46: [2023-04-29 11:26:42,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +46: [2023-04-29 11:26:42,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 11:26:42,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +46: [2023-04-29 11:26:42,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +33: [2023-04-29 11:26:42,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +25: [2023-04-29 11:26:42,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 0: [2023-04-29 11:26:42,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +25: [2023-04-29 11:26:42,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +19: [2023-04-29 11:26:42,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +19: [2023-04-29 11:26:42,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +33: [2023-04-29 11:26:42,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +54: [2023-04-29 11:26:42,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +19: [2023-04-29 11:26:42,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +19: [2023-04-29 11:26:42,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +15: [2023-04-29 11:26:42,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +15: [2023-04-29 11:26:42,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +38: [2023-04-29 11:26:42,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +38: [2023-04-29 11:26:42,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +38: [2023-04-29 11:26:42,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +18: [2023-04-29 11:26:42,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +18: [2023-04-29 11:26:42,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +31: [2023-04-29 11:26:42,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +38: [2023-04-29 11:26:42,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +37: [2023-04-29 11:26:42,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 0: [2023-04-29 11:26:42,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +18: [2023-04-29 11:26:42,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +25: [2023-04-29 11:26:42,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +37: [2023-04-29 11:26:42,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +37: [2023-04-29 11:26:42,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +31: [2023-04-29 11:26:42,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +25: [2023-04-29 11:26:42,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +18: [2023-04-29 11:26:42,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +37: [2023-04-29 11:26:42,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +54: [2023-04-29 11:26:42,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +31: [2023-04-29 11:26:42,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +39: [2023-04-29 11:26:42,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +39: [2023-04-29 11:26:42,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +39: [2023-04-29 11:26:42,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +10: [2023-04-29 11:26:42,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +39: [2023-04-29 11:26:42,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +48: [2023-04-29 11:26:42,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +48: [2023-04-29 11:26:42,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +11: [2023-04-29 11:26:42,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +11: [2023-04-29 11:26:42,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +11: [2023-04-29 11:26:42,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 8: [2023-04-29 11:26:42,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +11: [2023-04-29 11:26:42,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 8: [2023-04-29 11:26:42,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 8: [2023-04-29 11:26:42,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 8: [2023-04-29 11:26:42,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +41: [2023-04-29 11:26:42,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +41: [2023-04-29 11:26:42,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +41: [2023-04-29 11:26:42,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. + 7: [2023-04-29 11:26:42,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 7: [2023-04-29 11:26:42,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 7: [2023-04-29 11:26:42,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +63: [2023-04-29 11:26:42,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +41: [2023-04-29 11:26:42,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. + 7: [2023-04-29 11:26:42,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +10: [2023-04-29 11:26:42,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +11: [2023-04-29 11:26:42,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +48: [2023-04-29 11:26:42,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +48: [2023-04-29 11:26:42,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +24: [2023-04-29 11:26:42,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +24: [2023-04-29 11:26:42,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +24: [2023-04-29 11:26:42,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +63: [2023-04-29 11:26:42,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 9: [2023-04-29 11:26:42,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 9: [2023-04-29 11:26:42,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +11: [2023-04-29 11:26:42,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 9: [2023-04-29 11:26:42,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 9: [2023-04-29 11:26:42,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +11: [2023-04-29 11:26:42,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +11: [2023-04-29 11:26:42,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +26: [2023-04-29 11:26:42,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +47: [2023-04-29 11:26:42,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +24: [2023-04-29 11:26:42,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +33: [2023-04-29 11:26:42,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +29: [2023-04-29 11:26:42,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +29: [2023-04-29 11:26:42,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +29: [2023-04-29 11:26:42,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +26: [2023-04-29 11:26:42,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +29: [2023-04-29 11:26:42,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +63: [2023-04-29 11:26:42,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +63: [2023-04-29 11:26:42,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +47: [2023-04-29 11:26:42,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +26: [2023-04-29 11:26:42,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +15: [2023-04-29 11:26:42,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +15: [2023-04-29 11:26:42,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +50: [2023-04-29 11:26:42,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 11:26:42,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 11:26:42,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 11:26:42,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 11:26:42,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +26: [2023-04-29 11:26:42,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +50: [2023-04-29 11:26:42,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 11:26:42,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 11:26:42,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +29: [2023-04-29 11:26:42,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +29: [2023-04-29 11:26:42,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +15: [2023-04-29 11:26:42,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +15: [2023-04-29 11:26:42,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +29: [2023-04-29 11:26:42,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 11:26:42,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +29: [2023-04-29 11:26:42,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 11:26:42,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 11:26:42,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 11:26:42,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +33: [2023-04-29 11:26:42,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +18: [2023-04-29 11:26:42,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +50: [2023-04-29 11:26:42,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +50: [2023-04-29 11:26:42,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +50: [2023-04-29 11:26:42,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +38: [2023-04-29 11:26:42,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +38: [2023-04-29 11:26:42,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +18: [2023-04-29 11:26:42,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +33: [2023-04-29 11:26:42,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 1: [2023-04-29 11:26:42,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +50: [2023-04-29 11:26:42,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... + 1: [2023-04-29 11:26:42,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 1: [2023-04-29 11:26:42,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 0: [2023-04-29 11:26:42,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +38: [2023-04-29 11:26:42,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +18: [2023-04-29 11:26:42,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +18: [2023-04-29 11:26:42,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +38: [2023-04-29 11:26:42,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +12: [2023-04-29 11:26:42,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +12: [2023-04-29 11:26:42,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +43: [2023-04-29 11:26:42,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +50: [2023-04-29 11:26:42,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 8: [2023-04-29 11:26:42,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +41: [2023-04-29 11:26:42,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +50: [2023-04-29 11:26:42,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 7: [2023-04-29 11:26:42,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 7: [2023-04-29 11:26:42,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +50: [2023-04-29 11:26:42,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +12: [2023-04-29 11:26:42,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +12: [2023-04-29 11:26:42,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +50: [2023-04-29 11:26:42,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 8: [2023-04-29 11:26:42,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +39: [2023-04-29 11:26:42,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +43: [2023-04-29 11:26:42,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +39: [2023-04-29 11:26:42,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 8: [2023-04-29 11:26:42,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +24: [2023-04-29 11:26:42,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +34: [2023-04-29 11:26:42,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +34: [2023-04-29 11:26:42,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +39: [2023-04-29 11:26:42,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +47: [2023-04-29 11:26:42,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 7: [2023-04-29 11:26:42,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +43: [2023-04-29 11:26:42,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... + 8: [2023-04-29 11:26:42,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +34: [2023-04-29 11:26:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +47: [2023-04-29 11:26:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +34: [2023-04-29 11:26:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +34: [2023-04-29 11:26:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +34: [2023-04-29 11:26:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +34: [2023-04-29 11:26:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 9: [2023-04-29 11:26:42,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +34: [2023-04-29 11:26:42,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 9: [2023-04-29 11:26:42,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +31: [2023-04-29 11:26:42,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +31: [2023-04-29 11:26:42,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +31: [2023-04-29 11:26:42,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +31: [2023-04-29 11:26:42,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +41: [2023-04-29 11:26:42,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +39: [2023-04-29 11:26:42,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 9: [2023-04-29 11:26:42,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +41: [2023-04-29 11:26:42,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 9: [2023-04-29 11:26:42,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +63: [2023-04-29 11:26:42,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +43: [2023-04-29 11:26:42,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +63: [2023-04-29 11:26:42,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +47: [2023-04-29 11:26:42,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +34: [2023-04-29 11:26:42,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +41: [2023-04-29 11:26:42,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 11:26:42,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +24: [2023-04-29 11:26:42,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +34: [2023-04-29 11:26:42,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... + 6: [2023-04-29 11:26:42,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 6: [2023-04-29 11:26:42,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +43: [2023-04-29 11:26:42,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +51: [2023-04-29 11:26:42,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +51: [2023-04-29 11:26:42,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +51: [2023-04-29 11:26:42,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +51: [2023-04-29 11:26:42,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +15: [2023-04-29 11:26:42,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +15: [2023-04-29 11:26:42,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +15: [2023-04-29 11:26:42,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +20: [2023-04-29 11:26:42,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +21: [2023-04-29 11:26:42,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +21: [2023-04-29 11:26:42,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +15: [2023-04-29 11:26:42,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +34: [2023-04-29 11:26:42,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +20: [2023-04-29 11:26:42,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +20: [2023-04-29 11:26:42,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +24: [2023-04-29 11:26:42,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +24: [2023-04-29 11:26:42,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +20: [2023-04-29 11:26:42,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +43: [2023-04-29 11:26:42,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +34: [2023-04-29 11:26:42,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +23: [2023-04-29 11:26:42,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +47: [2023-04-29 11:26:42,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +23: [2023-04-29 11:26:42,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +21: [2023-04-29 11:26:42,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 6: [2023-04-29 11:26:42,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +21: [2023-04-29 11:26:42,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +34: [2023-04-29 11:26:42,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +34: [2023-04-29 11:26:42,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 11:26:42,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +43: [2023-04-29 11:26:42,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +51: [2023-04-29 11:26:42,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +24: [2023-04-29 11:26:42,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +24: [2023-04-29 11:26:42,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +37: [2023-04-29 11:26:42,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +37: [2023-04-29 11:26:42,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +37: [2023-04-29 11:26:42,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +37: [2023-04-29 11:26:42,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +51: [2023-04-29 11:26:42,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +43: [2023-04-29 11:26:42,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +51: [2023-04-29 11:26:42,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +51: [2023-04-29 11:26:42,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +23: [2023-04-29 11:26:42,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +21: [2023-04-29 11:26:42,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +21: [2023-04-29 11:26:42,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +55: [2023-04-29 11:26:42,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +55: [2023-04-29 11:26:42,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +55: [2023-04-29 11:26:42,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +21: [2023-04-29 11:26:42,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +23: [2023-04-29 11:26:42,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +21: [2023-04-29 11:26:42,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +55: [2023-04-29 11:26:42,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +23: [2023-04-29 11:26:42,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +24: [2023-04-29 11:26:42,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +24: [2023-04-29 11:26:42,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +18: [2023-04-29 11:26:42,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +18: [2023-04-29 11:26:42,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +18: [2023-04-29 11:26:42,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +23: [2023-04-29 11:26:42,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +18: [2023-04-29 11:26:42,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +24: [2023-04-29 11:26:42,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +24: [2023-04-29 11:26:42,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +23: [2023-04-29 11:26:42,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +57: [2023-04-29 11:26:42,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +37: [2023-04-29 11:26:42,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +37: [2023-04-29 11:26:42,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +57: [2023-04-29 11:26:42,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +57: [2023-04-29 11:26:42,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +57: [2023-04-29 11:26:42,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +37: [2023-04-29 11:26:42,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +37: [2023-04-29 11:26:42,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +37: [2023-04-29 11:26:42,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +55: [2023-04-29 11:26:42,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +55: [2023-04-29 11:26:42,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +55: [2023-04-29 11:26:42,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +24: [2023-04-29 11:26:42,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +24: [2023-04-29 11:26:42,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +55: [2023-04-29 11:26:42,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +12: [2023-04-29 11:26:42,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +23: [2023-04-29 11:26:42,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +12: [2023-04-29 11:26:42,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +37: [2023-04-29 11:26:42,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +41: [2023-04-29 11:26:42,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +41: [2023-04-29 11:26:42,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +41: [2023-04-29 11:26:42,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +41: [2023-04-29 11:26:42,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 0: [2023-04-29 11:26:42,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 6: [2023-04-29 11:26:42,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 6: [2023-04-29 11:26:42,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 6: [2023-04-29 11:26:42,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 6: [2023-04-29 11:26:42,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +12: [2023-04-29 11:26:42,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +31: [2023-04-29 11:26:42,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +31: [2023-04-29 11:26:42,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +12: [2023-04-29 11:26:42,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +59: [2023-04-29 11:26:42,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +59: [2023-04-29 11:26:42,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +59: [2023-04-29 11:26:42,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +59: [2023-04-29 11:26:42,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +59: [2023-04-29 11:26:42,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +59: [2023-04-29 11:26:42,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +59: [2023-04-29 11:26:42,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +59: [2023-04-29 11:26:42,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 0: [2023-04-29 11:26:42,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +47: [2023-04-29 11:26:42,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +41: [2023-04-29 11:26:42,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +41: [2023-04-29 11:26:42,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +41: [2023-04-29 11:26:42,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +58: [2023-04-29 11:26:42,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +58: [2023-04-29 11:26:42,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +58: [2023-04-29 11:26:42,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +41: [2023-04-29 11:26:42,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +31: [2023-04-29 11:26:42,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +58: [2023-04-29 11:26:42,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +31: [2023-04-29 11:26:42,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +59: [2023-04-29 11:26:42,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +59: [2023-04-29 11:26:42,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +59: [2023-04-29 11:26:42,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +20: [2023-04-29 11:26:42,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +47: [2023-04-29 11:26:42,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +20: [2023-04-29 11:26:42,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +15: [2023-04-29 11:26:42,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +11: [2023-04-29 11:26:42,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +15: [2023-04-29 11:26:42,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +26: [2023-04-29 11:26:42,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +37: [2023-04-29 11:26:42,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +37: [2023-04-29 11:26:42,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +20: [2023-04-29 11:26:42,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +59: [2023-04-29 11:26:42,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +59: [2023-04-29 11:26:42,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +15: [2023-04-29 11:26:42,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +15: [2023-04-29 11:26:42,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +59: [2023-04-29 11:26:42,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +59: [2023-04-29 11:26:42,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +59: [2023-04-29 11:26:42,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +20: [2023-04-29 11:26:42,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 11:26:42,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +26: [2023-04-29 11:26:42,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +18: [2023-04-29 11:26:42,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +18: [2023-04-29 11:26:42,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +38: [2023-04-29 11:26:42,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +37: [2023-04-29 11:26:42,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +57: [2023-04-29 11:26:42,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +57: [2023-04-29 11:26:42,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +18: [2023-04-29 11:26:42,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +37: [2023-04-29 11:26:42,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +37: [2023-04-29 11:26:42,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +49: [2023-04-29 11:26:42,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +49: [2023-04-29 11:26:42,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +14: [2023-04-29 11:26:42,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +14: [2023-04-29 11:26:42,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +18: [2023-04-29 11:26:42,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +19: [2023-04-29 11:26:42,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +19: [2023-04-29 11:26:42,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +26: [2023-04-29 11:26:42,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +57: [2023-04-29 11:26:42,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +57: [2023-04-29 11:26:42,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +29: [2023-04-29 11:26:42,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +19: [2023-04-29 11:26:42,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +19: [2023-04-29 11:26:42,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +29: [2023-04-29 11:26:42,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +30: [2023-04-29 11:26:42,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +30: [2023-04-29 11:26:42,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +30: [2023-04-29 11:26:42,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +14: [2023-04-29 11:26:42,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +26: [2023-04-29 11:26:42,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +14: [2023-04-29 11:26:42,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +38: [2023-04-29 11:26:42,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +49: [2023-04-29 11:26:42,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +49: [2023-04-29 11:26:42,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +26: [2023-04-29 11:26:42,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +49: [2023-04-29 11:26:42,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +38: [2023-04-29 11:26:42,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 8: [2023-04-29 11:26:42,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +37: [2023-04-29 11:26:42,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +30: [2023-04-29 11:26:42,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 7: [2023-04-29 11:26:42,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +19: [2023-04-29 11:26:42,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +49: [2023-04-29 11:26:42,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +11: [2023-04-29 11:26:42,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +11: [2023-04-29 11:26:42,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +11: [2023-04-29 11:26:42,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +19: [2023-04-29 11:26:42,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +19: [2023-04-29 11:26:42,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 6: [2023-04-29 11:26:42,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 6: [2023-04-29 11:26:42,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 6: [2023-04-29 11:26:42,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +29: [2023-04-29 11:26:42,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +26: [2023-04-29 11:26:42,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +28: [2023-04-29 11:26:42,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +28: [2023-04-29 11:26:42,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +41: [2023-04-29 11:26:42,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +28: [2023-04-29 11:26:42,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +39: [2023-04-29 11:26:42,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +39: [2023-04-29 11:26:42,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +28: [2023-04-29 11:26:42,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +49: [2023-04-29 11:26:42,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +38: [2023-04-29 11:26:42,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 1: [2023-04-29 11:26:42,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +10: [2023-04-29 11:26:42,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +10: [2023-04-29 11:26:42,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +38: [2023-04-29 11:26:42,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +26: [2023-04-29 11:26:42,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 8: [2023-04-29 11:26:42,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +63: [2023-04-29 11:26:42,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. + 9: [2023-04-29 11:26:42,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +53: [2023-04-29 11:26:42,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +53: [2023-04-29 11:26:42,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +53: [2023-04-29 11:26:42,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +63: [2023-04-29 11:26:42,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +63: [2023-04-29 11:26:42,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +53: [2023-04-29 11:26:42,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +14: [2023-04-29 11:26:42,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +49: [2023-04-29 11:26:42,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 11:26:42,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +26: [2023-04-29 11:26:42,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +10: [2023-04-29 11:26:42,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +17: [2023-04-29 11:26:42,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 11:26:42,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 11:26:42,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +14: [2023-04-29 11:26:42,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +17: [2023-04-29 11:26:42,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +29: [2023-04-29 11:26:42,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +10: [2023-04-29 11:26:42,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +35: [2023-04-29 11:26:42,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +35: [2023-04-29 11:26:42,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +35: [2023-04-29 11:26:42,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +11: [2023-04-29 11:26:42,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +28: [2023-04-29 11:26:42,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +35: [2023-04-29 11:26:42,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +28: [2023-04-29 11:26:42,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +24: [2023-04-29 11:26:42,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +41: [2023-04-29 11:26:42,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +39: [2023-04-29 11:26:42,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 9: [2023-04-29 11:26:42,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +39: [2023-04-29 11:26:42,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +14: [2023-04-29 11:26:42,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +39: [2023-04-29 11:26:42,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... + 1: [2023-04-29 11:26:42,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 1: [2023-04-29 11:26:42,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 1: [2023-04-29 11:26:42,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +14: [2023-04-29 11:26:42,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +28: [2023-04-29 11:26:42,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +56: [2023-04-29 11:26:42,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +56: [2023-04-29 11:26:42,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +38: [2023-04-29 11:26:42,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +28: [2023-04-29 11:26:42,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +38: [2023-04-29 11:26:42,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +53: [2023-04-29 11:26:42,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +53: [2023-04-29 11:26:42,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +53: [2023-04-29 11:26:42,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 9: [2023-04-29 11:26:42,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 9: [2023-04-29 11:26:42,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +50: [2023-04-29 11:26:42,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +53: [2023-04-29 11:26:42,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +17: [2023-04-29 11:26:42,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +24: [2023-04-29 11:26:42,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 7: [2023-04-29 11:26:42,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 9: [2023-04-29 11:26:42,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +41: [2023-04-29 11:26:42,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +39: [2023-04-29 11:26:42,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... + 8: [2023-04-29 11:26:42,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 11:26:42,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 8: [2023-04-29 11:26:42,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 8: [2023-04-29 11:26:42,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 9: [2023-04-29 11:26:42,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +58: [2023-04-29 11:26:42,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +58: [2023-04-29 11:26:42,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +58: [2023-04-29 11:26:42,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +50: [2023-04-29 11:26:42,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 11:26:42,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +50: [2023-04-29 11:26:42,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +34: [2023-04-29 11:26:42,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +17: [2023-04-29 11:26:42,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +56: [2023-04-29 11:26:42,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +56: [2023-04-29 11:26:42,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +56: [2023-04-29 11:26:42,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +56: [2023-04-29 11:26:42,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +56: [2023-04-29 11:26:42,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +56: [2023-04-29 11:26:42,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +17: [2023-04-29 11:26:42,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +38: [2023-04-29 11:26:42,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +58: [2023-04-29 11:26:42,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +39: [2023-04-29 11:26:42,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 9: [2023-04-29 11:26:42,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 9: [2023-04-29 11:26:42,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 8: [2023-04-29 11:26:42,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 8: [2023-04-29 11:26:42,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +41: [2023-04-29 11:26:42,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... + 8: [2023-04-29 11:26:42,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +41: [2023-04-29 11:26:42,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +51: [2023-04-29 11:26:42,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +56: [2023-04-29 11:26:42,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +58: [2023-04-29 11:26:42,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +58: [2023-04-29 11:26:42,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +58: [2023-04-29 11:26:42,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +58: [2023-04-29 11:26:42,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +29: [2023-04-29 11:26:42,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +56: [2023-04-29 11:26:42,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 7: [2023-04-29 11:26:42,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +20: [2023-04-29 11:26:42,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +20: [2023-04-29 11:26:42,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +56: [2023-04-29 11:26:42,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +39: [2023-04-29 11:26:42,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +41: [2023-04-29 11:26:42,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +20: [2023-04-29 11:26:42,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +20: [2023-04-29 11:26:42,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +29: [2023-04-29 11:26:42,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 7: [2023-04-29 11:26:42,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +41: [2023-04-29 11:26:42,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +56: [2023-04-29 11:26:42,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +23: [2023-04-29 11:26:42,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +23: [2023-04-29 11:26:42,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +23: [2023-04-29 11:26:42,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +23: [2023-04-29 11:26:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +25: [2023-04-29 11:26:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +25: [2023-04-29 11:26:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +25: [2023-04-29 11:26:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +25: [2023-04-29 11:26:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +52: [2023-04-29 11:26:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 11:26:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 11:26:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 11:26:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 11:26:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 11:26:42,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 11:26:42,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 11:26:42,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +34: [2023-04-29 11:26:42,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +58: [2023-04-29 11:26:42,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +30: [2023-04-29 11:26:42,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +58: [2023-04-29 11:26:42,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +30: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +58: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +30: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +30: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +46: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +46: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +46: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +46: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +46: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +46: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +51: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +46: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +51: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +46: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +21: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +21: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +21: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +47: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +47: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +57: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +57: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +55: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +20: [2023-04-29 11:26:42,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +47: [2023-04-29 11:26:42,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +34: [2023-04-29 11:26:42,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +47: [2023-04-29 11:26:42,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +58: [2023-04-29 11:26:42,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +20: [2023-04-29 11:26:42,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +48: [2023-04-29 11:26:42,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +48: [2023-04-29 11:26:42,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +48: [2023-04-29 11:26:42,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +48: [2023-04-29 11:26:42,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +48: [2023-04-29 11:26:42,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +41: [2023-04-29 11:26:42,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +11: [2023-04-29 11:26:42,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +48: [2023-04-29 11:26:42,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +48: [2023-04-29 11:26:42,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +20: [2023-04-29 11:26:42,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +48: [2023-04-29 11:26:42,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +20: [2023-04-29 11:26:42,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +51: [2023-04-29 11:26:42,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +11: [2023-04-29 11:26:42,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +11: [2023-04-29 11:26:42,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +23: [2023-04-29 11:26:42,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +23: [2023-04-29 11:26:42,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +24: [2023-04-29 11:26:42,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +52: [2023-04-29 11:26:42,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +52: [2023-04-29 11:26:42,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +52: [2023-04-29 11:26:42,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +52: [2023-04-29 11:26:42,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +52: [2023-04-29 11:26:42,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +21: [2023-04-29 11:26:42,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +29: [2023-04-29 11:26:42,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +52: [2023-04-29 11:26:42,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +52: [2023-04-29 11:26:42,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +46: [2023-04-29 11:26:42,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +57: [2023-04-29 11:26:42,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +57: [2023-04-29 11:26:42,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 1: [2023-04-29 11:26:42,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +48: [2023-04-29 11:26:42,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +46: [2023-04-29 11:26:42,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 11:26:42,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +37: [2023-04-29 11:26:42,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 11:26:42,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +46: [2023-04-29 11:26:42,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +24: [2023-04-29 11:26:42,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +46: [2023-04-29 11:26:42,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +46: [2023-04-29 11:26:42,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +46: [2023-04-29 11:26:42,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 11:26:42,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +29: [2023-04-29 11:26:42,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +57: [2023-04-29 11:26:42,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +35: [2023-04-29 11:26:42,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +10: [2023-04-29 11:26:42,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +46: [2023-04-29 11:26:42,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +57: [2023-04-29 11:26:42,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +10: [2023-04-29 11:26:42,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +24: [2023-04-29 11:26:42,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +24: [2023-04-29 11:26:42,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +24: [2023-04-29 11:26:42,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +10: [2023-04-29 11:26:42,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +44: [2023-04-29 11:26:42,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +46: [2023-04-29 11:26:42,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +44: [2023-04-29 11:26:42,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +55: [2023-04-29 11:26:42,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +44: [2023-04-29 11:26:42,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +23: [2023-04-29 11:26:42,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +44: [2023-04-29 11:26:42,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +44: [2023-04-29 11:26:42,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +44: [2023-04-29 11:26:42,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +48: [2023-04-29 11:26:42,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +45: [2023-04-29 11:26:42,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +48: [2023-04-29 11:26:42,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +44: [2023-04-29 11:26:42,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +45: [2023-04-29 11:26:42,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. + 1: [2023-04-29 11:26:42,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +44: [2023-04-29 11:26:42,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +45: [2023-04-29 11:26:42,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +48: [2023-04-29 11:26:42,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +48: [2023-04-29 11:26:42,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +42: [2023-04-29 11:26:42,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +42: [2023-04-29 11:26:42,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +45: [2023-04-29 11:26:42,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +63: [2023-04-29 11:26:42,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 11:26:42,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +48: [2023-04-29 11:26:42,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +57: [2023-04-29 11:26:42,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +35: [2023-04-29 11:26:42,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +48: [2023-04-29 11:26:42,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +48: [2023-04-29 11:26:42,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... + 0: [2023-04-29 11:26:42,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +40: [2023-04-29 11:26:42,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +40: [2023-04-29 11:26:42,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +35: [2023-04-29 11:26:42,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +10: [2023-04-29 11:26:42,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +40: [2023-04-29 11:26:42,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +56: [2023-04-29 11:26:42,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +40: [2023-04-29 11:26:42,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +42: [2023-04-29 11:26:42,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +37: [2023-04-29 11:26:42,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +57: [2023-04-29 11:26:42,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +56: [2023-04-29 11:26:42,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +35: [2023-04-29 11:26:42,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +42: [2023-04-29 11:26:42,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +63: [2023-04-29 11:26:42,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +55: [2023-04-29 11:26:42,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +31: [2023-04-29 11:26:42,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 1: [2023-04-29 11:26:42,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +34: [2023-04-29 11:26:42,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +44: [2023-04-29 11:26:42,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +44: [2023-04-29 11:26:42,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +61: [2023-04-29 11:26:42,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +61: [2023-04-29 11:26:42,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +61: [2023-04-29 11:26:42,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 11:26:42,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +61: [2023-04-29 11:26:42,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +42: [2023-04-29 11:26:42,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +24: [2023-04-29 11:26:42,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +24: [2023-04-29 11:26:42,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +56: [2023-04-29 11:26:42,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +42: [2023-04-29 11:26:42,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +42: [2023-04-29 11:26:42,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +24: [2023-04-29 11:26:42,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +44: [2023-04-29 11:26:42,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +23: [2023-04-29 11:26:42,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +42: [2023-04-29 11:26:42,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +41: [2023-04-29 11:26:42,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +37: [2023-04-29 11:26:42,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +42: [2023-04-29 11:26:42,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +31: [2023-04-29 11:26:42,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +37: [2023-04-29 11:26:42,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +50: [2023-04-29 11:26:42,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +42: [2023-04-29 11:26:42,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +31: [2023-04-29 11:26:42,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +55: [2023-04-29 11:26:42,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +61: [2023-04-29 11:26:42,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +61: [2023-04-29 11:26:42,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +61: [2023-04-29 11:26:42,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +61: [2023-04-29 11:26:42,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +42: [2023-04-29 11:26:42,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +42: [2023-04-29 11:26:42,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +15: [2023-04-29 11:26:42,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +31: [2023-04-29 11:26:42,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +31: [2023-04-29 11:26:42,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +20: [2023-04-29 11:26:42,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +51: [2023-04-29 11:26:42,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +56: [2023-04-29 11:26:42,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +41: [2023-04-29 11:26:42,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +41: [2023-04-29 11:26:42,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +29: [2023-04-29 11:26:42,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +29: [2023-04-29 11:26:42,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +41: [2023-04-29 11:26:42,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +29: [2023-04-29 11:26:42,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +23: [2023-04-29 11:26:42,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +25: [2023-04-29 11:26:42,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +29: [2023-04-29 11:26:42,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +31: [2023-04-29 11:26:42,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +20: [2023-04-29 11:26:42,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +15: [2023-04-29 11:26:42,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +39: [2023-04-29 11:26:42,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +39: [2023-04-29 11:26:42,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +31: [2023-04-29 11:26:42,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +25: [2023-04-29 11:26:42,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +31: [2023-04-29 11:26:42,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +25: [2023-04-29 11:26:42,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +47: [2023-04-29 11:26:42,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +25: [2023-04-29 11:26:42,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +24: [2023-04-29 11:26:42,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +20: [2023-04-29 11:26:42,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 0: [2023-04-29 11:26:42,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 0: [2023-04-29 11:26:42,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +50: [2023-04-29 11:26:42,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 0: [2023-04-29 11:26:42,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +15: [2023-04-29 11:26:42,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +15: [2023-04-29 11:26:42,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +15: [2023-04-29 11:26:42,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +47: [2023-04-29 11:26:42,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +47: [2023-04-29 11:26:42,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +23: [2023-04-29 11:26:42,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +23: [2023-04-29 11:26:42,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +39: [2023-04-29 11:26:42,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +50: [2023-04-29 11:26:42,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +39: [2023-04-29 11:26:42,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +23: [2023-04-29 11:26:42,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +21: [2023-04-29 11:26:42,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +21: [2023-04-29 11:26:42,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +34: [2023-04-29 11:26:42,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +24: [2023-04-29 11:26:42,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +50: [2023-04-29 11:26:42,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +51: [2023-04-29 11:26:42,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 11:26:42,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +51: [2023-04-29 11:26:42,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +18: [2023-04-29 11:26:42,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +24: [2023-04-29 11:26:42,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +57: [2023-04-29 11:26:42,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +55: [2023-04-29 11:26:42,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +16: [2023-04-29 11:26:42,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +16: [2023-04-29 11:26:42,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +16: [2023-04-29 11:26:42,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +20: [2023-04-29 11:26:42,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +16: [2023-04-29 11:26:42,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +51: [2023-04-29 11:26:42,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +21: [2023-04-29 11:26:42,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +55: [2023-04-29 11:26:42,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +21: [2023-04-29 11:26:42,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +55: [2023-04-29 11:26:42,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +18: [2023-04-29 11:26:42,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +55: [2023-04-29 11:26:42,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +39: [2023-04-29 11:26:42,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +59: [2023-04-29 11:26:42,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +59: [2023-04-29 11:26:42,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +59: [2023-04-29 11:26:42,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +24: [2023-04-29 11:26:42,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +15: [2023-04-29 11:26:42,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +39: [2023-04-29 11:26:42,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +37: [2023-04-29 11:26:42,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +45: [2023-04-29 11:26:42,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +15: [2023-04-29 11:26:42,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +15: [2023-04-29 11:26:42,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +39: [2023-04-29 11:26:42,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +55: [2023-04-29 11:26:42,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +20: [2023-04-29 11:26:42,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +34: [2023-04-29 11:26:42,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +18: [2023-04-29 11:26:42,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +39: [2023-04-29 11:26:42,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +23: [2023-04-29 11:26:42,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 6: [2023-04-29 11:26:42,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +54: [2023-04-29 11:26:42,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +54: [2023-04-29 11:26:42,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +23: [2023-04-29 11:26:42,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +49: [2023-04-29 11:26:42,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +57: [2023-04-29 11:26:42,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +57: [2023-04-29 11:26:42,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +18: [2023-04-29 11:26:42,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +45: [2023-04-29 11:26:42,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +44: [2023-04-29 11:26:42,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +16: [2023-04-29 11:26:42,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +16: [2023-04-29 11:26:42,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +55: [2023-04-29 11:26:42,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +18: [2023-04-29 11:26:42,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +16: [2023-04-29 11:26:42,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +59: [2023-04-29 11:26:42,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +44: [2023-04-29 11:26:42,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +34: [2023-04-29 11:26:42,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +44: [2023-04-29 11:26:42,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +54: [2023-04-29 11:26:42,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +54: [2023-04-29 11:26:42,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +18: [2023-04-29 11:26:42,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +23: [2023-04-29 11:26:42,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +45: [2023-04-29 11:26:42,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +45: [2023-04-29 11:26:42,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +16: [2023-04-29 11:26:42,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +49: [2023-04-29 11:26:42,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +40: [2023-04-29 11:26:42,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +44: [2023-04-29 11:26:42,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +18: [2023-04-29 11:26:42,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +37: [2023-04-29 11:26:42,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +55: [2023-04-29 11:26:42,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +20: [2023-04-29 11:26:42,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 6: [2023-04-29 11:26:42,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +54: [2023-04-29 11:26:42,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +20: [2023-04-29 11:26:42,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +57: [2023-04-29 11:26:42,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +28: [2023-04-29 11:26:42,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +54: [2023-04-29 11:26:42,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +57: [2023-04-29 11:26:42,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +18: [2023-04-29 11:26:42,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +57: [2023-04-29 11:26:42,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +42: [2023-04-29 11:26:42,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +41: [2023-04-29 11:26:42,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +40: [2023-04-29 11:26:42,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 9: [2023-04-29 11:26:42,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 9: [2023-04-29 11:26:42,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 9: [2023-04-29 11:26:42,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +35: [2023-04-29 11:26:42,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +40: [2023-04-29 11:26:42,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 9: [2023-04-29 11:26:42,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +35: [2023-04-29 11:26:42,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +40: [2023-04-29 11:26:42,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +35: [2023-04-29 11:26:42,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +35: [2023-04-29 11:26:42,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +54: [2023-04-29 11:26:42,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 11:26:42,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +42: [2023-04-29 11:26:42,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 6: [2023-04-29 11:26:42,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 6: [2023-04-29 11:26:42,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +57: [2023-04-29 11:26:42,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +57: [2023-04-29 11:26:42,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +37: [2023-04-29 11:26:42,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 9: [2023-04-29 11:26:42,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 9: [2023-04-29 11:26:42,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 9: [2023-04-29 11:26:42,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +37: [2023-04-29 11:26:42,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 9: [2023-04-29 11:26:42,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +42: [2023-04-29 11:26:42,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +20: [2023-04-29 11:26:42,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +49: [2023-04-29 11:26:42,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +28: [2023-04-29 11:26:42,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +35: [2023-04-29 11:26:42,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +35: [2023-04-29 11:26:42,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +14: [2023-04-29 11:26:42,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +14: [2023-04-29 11:26:42,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +23: [2023-04-29 11:26:42,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +42: [2023-04-29 11:26:42,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +41: [2023-04-29 11:26:42,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +41: [2023-04-29 11:26:42,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +17: [2023-04-29 11:26:42,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +14: [2023-04-29 11:26:42,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +22: [2023-04-29 11:26:42,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +22: [2023-04-29 11:26:42,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +41: [2023-04-29 11:26:42,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +29: [2023-04-29 11:26:42,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +28: [2023-04-29 11:26:42,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +28: [2023-04-29 11:26:42,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +49: [2023-04-29 11:26:42,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +35: [2023-04-29 11:26:42,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +28: [2023-04-29 11:26:42,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +53: [2023-04-29 11:26:42,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +29: [2023-04-29 11:26:42,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +29: [2023-04-29 11:26:42,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +22: [2023-04-29 11:26:42,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +35: [2023-04-29 11:26:42,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +24: [2023-04-29 11:26:42,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +22: [2023-04-29 11:26:42,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +28: [2023-04-29 11:26:42,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +36: [2023-04-29 11:26:42,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +36: [2023-04-29 11:26:42,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +53: [2023-04-29 11:26:42,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +55: [2023-04-29 11:26:42,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +29: [2023-04-29 11:26:42,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +53: [2023-04-29 11:26:42,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +28: [2023-04-29 11:26:42,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +28: [2023-04-29 11:26:42,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +53: [2023-04-29 11:26:42,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +24: [2023-04-29 11:26:42,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +14: [2023-04-29 11:26:42,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 11:26:42,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 11:26:42,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +58: [2023-04-29 11:26:42,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +58: [2023-04-29 11:26:42,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +58: [2023-04-29 11:26:42,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 11:26:42,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +36: [2023-04-29 11:26:42,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +55: [2023-04-29 11:26:42,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +46: [2023-04-29 11:26:42,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +58: [2023-04-29 11:26:42,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +58: [2023-04-29 11:26:42,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +17: [2023-04-29 11:26:42,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +58: [2023-04-29 11:26:42,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +59: [2023-04-29 11:26:42,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +56: [2023-04-29 11:26:42,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +49: [2023-04-29 11:26:42,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +58: [2023-04-29 11:26:42,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +59: [2023-04-29 11:26:42,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +59: [2023-04-29 11:26:42,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +30: [2023-04-29 11:26:42,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +30: [2023-04-29 11:26:42,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +30: [2023-04-29 11:26:42,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +30: [2023-04-29 11:26:42,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +20: [2023-04-29 11:26:42,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +52: [2023-04-29 11:26:42,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +49: [2023-04-29 11:26:42,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +57: [2023-04-29 11:26:42,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +30: [2023-04-29 11:26:42,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +52: [2023-04-29 11:26:42,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +58: [2023-04-29 11:26:42,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +20: [2023-04-29 11:26:42,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +55: [2023-04-29 11:26:42,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +28: [2023-04-29 11:26:42,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +10: [2023-04-29 11:26:42,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +46: [2023-04-29 11:26:42,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +55: [2023-04-29 11:26:42,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +30: [2023-04-29 11:26:42,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +59: [2023-04-29 11:26:42,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +46: [2023-04-29 11:26:42,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +30: [2023-04-29 11:26:42,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +30: [2023-04-29 11:26:42,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +30: [2023-04-29 11:26:42,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +52: [2023-04-29 11:26:42,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +52: [2023-04-29 11:26:42,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +30: [2023-04-29 11:26:42,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +30: [2023-04-29 11:26:42,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +30: [2023-04-29 11:26:42,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +55: [2023-04-29 11:26:42,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +58: [2023-04-29 11:26:42,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 4: [2023-04-29 11:26:42,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 4: [2023-04-29 11:26:42,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +63: [2023-04-29 11:26:42,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +48: [2023-04-29 11:26:42,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +48: [2023-04-29 11:26:42,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 11:26:42,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +56: [2023-04-29 11:26:42,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +56: [2023-04-29 11:26:42,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +60: [2023-04-29 11:26:42,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +30: [2023-04-29 11:26:42,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +10: [2023-04-29 11:26:42,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +58: [2023-04-29 11:26:42,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +20: [2023-04-29 11:26:42,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 4: [2023-04-29 11:26:42,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +30: [2023-04-29 11:26:42,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +20: [2023-04-29 11:26:42,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 3: [2023-04-29 11:26:42,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 3: [2023-04-29 11:26:42,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 3: [2023-04-29 11:26:42,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 4: [2023-04-29 11:26:42,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +17: [2023-04-29 11:26:42,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 3: [2023-04-29 11:26:42,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +60: [2023-04-29 11:26:42,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +60: [2023-04-29 11:26:42,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +40: [2023-04-29 11:26:42,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +40: [2023-04-29 11:26:42,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +40: [2023-04-29 11:26:42,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +61: [2023-04-29 11:26:42,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +40: [2023-04-29 11:26:42,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +22: [2023-04-29 11:26:42,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +30: [2023-04-29 11:26:42,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +30: [2023-04-29 11:26:42,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +10: [2023-04-29 11:26:42,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +22: [2023-04-29 11:26:42,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +57: [2023-04-29 11:26:42,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +10: [2023-04-29 11:26:42,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +57: [2023-04-29 11:26:42,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +10: [2023-04-29 11:26:42,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +53: [2023-04-29 11:26:42,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +58: [2023-04-29 11:26:42,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +28: [2023-04-29 11:26:42,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 3: [2023-04-29 11:26:42,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +46: [2023-04-29 11:26:42,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +53: [2023-04-29 11:26:42,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +53: [2023-04-29 11:26:42,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +60: [2023-04-29 11:26:42,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 11:26:42,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +48: [2023-04-29 11:26:42,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +48: [2023-04-29 11:26:42,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 3: [2023-04-29 11:26:42,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +60: [2023-04-29 11:26:42,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +40: [2023-04-29 11:26:42,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +40: [2023-04-29 11:26:42,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +57: [2023-04-29 11:26:42,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +63: [2023-04-29 11:26:42,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +63: [2023-04-29 11:26:42,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +53: [2023-04-29 11:26:42,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +58: [2023-04-29 11:26:42,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 3: [2023-04-29 11:26:42,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +49: [2023-04-29 11:26:42,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +47: [2023-04-29 11:26:42,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 11:26:42,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +35: [2023-04-29 11:26:42,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +14: [2023-04-29 11:26:42,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +22: [2023-04-29 11:26:42,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +44: [2023-04-29 11:26:42,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 3: [2023-04-29 11:26:42,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +22: [2023-04-29 11:26:42,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +10: [2023-04-29 11:26:42,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 4: [2023-04-29 11:26:42,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +36: [2023-04-29 11:26:42,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +40: [2023-04-29 11:26:42,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +63: [2023-04-29 11:26:42,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 4: [2023-04-29 11:26:42,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 4: [2023-04-29 11:26:42,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +60: [2023-04-29 11:26:42,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +63: [2023-04-29 11:26:42,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +28: [2023-04-29 11:26:42,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +40: [2023-04-29 11:26:42,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +10: [2023-04-29 11:26:42,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +56: [2023-04-29 11:26:42,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 4: [2023-04-29 11:26:42,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +61: [2023-04-29 11:26:42,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +49: [2023-04-29 11:26:42,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +14: [2023-04-29 11:26:42,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +36: [2023-04-29 11:26:42,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +35: [2023-04-29 11:26:42,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +35: [2023-04-29 11:26:42,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +35: [2023-04-29 11:26:42,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +56: [2023-04-29 11:26:42,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +61: [2023-04-29 11:26:42,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 11:26:42,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +61: [2023-04-29 11:26:42,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +47: [2023-04-29 11:26:42,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +14: [2023-04-29 11:26:42,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +10: [2023-04-29 11:26:42,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +36: [2023-04-29 11:26:42,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +46: [2023-04-29 11:26:42,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +25: [2023-04-29 11:26:42,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +28: [2023-04-29 11:26:42,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +28: [2023-04-29 11:26:42,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +28: [2023-04-29 11:26:42,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +17: [2023-04-29 11:26:42,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 4: [2023-04-29 11:26:42,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +47: [2023-04-29 11:26:42,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +28: [2023-04-29 11:26:42,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +28: [2023-04-29 11:26:42,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +23: [2023-04-29 11:26:42,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +23: [2023-04-29 11:26:42,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +58: [2023-04-29 11:26:42,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +52: [2023-04-29 11:26:42,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +56: [2023-04-29 11:26:42,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +56: [2023-04-29 11:26:42,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +56: [2023-04-29 11:26:42,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +20: [2023-04-29 11:26:42,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +35: [2023-04-29 11:26:42,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +47: [2023-04-29 11:26:42,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +56: [2023-04-29 11:26:42,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 4: [2023-04-29 11:26:42,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +14: [2023-04-29 11:26:42,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +44: [2023-04-29 11:26:42,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 1: [2023-04-29 11:26:42,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 1: [2023-04-29 11:26:42,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 1: [2023-04-29 11:26:42,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +52: [2023-04-29 11:26:42,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +25: [2023-04-29 11:26:42,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +21: [2023-04-29 11:26:42,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +21: [2023-04-29 11:26:42,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +21: [2023-04-29 11:26:42,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 1: [2023-04-29 11:26:42,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +21: [2023-04-29 11:26:42,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +47: [2023-04-29 11:26:42,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +17: [2023-04-29 11:26:42,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 4: [2023-04-29 11:26:42,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +35: [2023-04-29 11:26:42,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +35: [2023-04-29 11:26:42,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +35: [2023-04-29 11:26:42,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +57: [2023-04-29 11:26:42,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 4: [2023-04-29 11:26:42,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +46: [2023-04-29 11:26:42,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +23: [2023-04-29 11:26:42,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +23: [2023-04-29 11:26:42,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +20: [2023-04-29 11:26:42,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +25: [2023-04-29 11:26:42,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +25: [2023-04-29 11:26:42,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +16: [2023-04-29 11:26:42,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +16: [2023-04-29 11:26:42,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +47: [2023-04-29 11:26:42,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +47: [2023-04-29 11:26:42,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +25: [2023-04-29 11:26:42,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +63: [2023-04-29 11:26:42,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +11: [2023-04-29 11:26:42,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +11: [2023-04-29 11:26:42,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +11: [2023-04-29 11:26:42,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +11: [2023-04-29 11:26:42,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +39: [2023-04-29 11:26:42,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +23: [2023-04-29 11:26:42,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +63: [2023-04-29 11:26:42,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +46: [2023-04-29 11:26:42,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +16: [2023-04-29 11:26:42,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +13: [2023-04-29 11:26:42,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +13: [2023-04-29 11:26:42,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +44: [2023-04-29 11:26:42,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +48: [2023-04-29 11:26:42,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +42: [2023-04-29 11:26:42,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +16: [2023-04-29 11:26:42,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 2: [2023-04-29 11:26:42,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 2: [2023-04-29 11:26:42,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 2: [2023-04-29 11:26:42,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 2: [2023-04-29 11:26:42,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +23: [2023-04-29 11:26:42,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +39: [2023-04-29 11:26:42,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +39: [2023-04-29 11:26:42,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +63: [2023-04-29 11:26:42,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +56: [2023-04-29 11:26:42,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +52: [2023-04-29 11:26:42,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +56: [2023-04-29 11:26:42,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +52: [2023-04-29 11:26:42,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +42: [2023-04-29 11:26:42,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +56: [2023-04-29 11:26:42,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +47: [2023-04-29 11:26:42,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +17: [2023-04-29 11:26:42,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +58: [2023-04-29 11:26:42,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +56: [2023-04-29 11:26:42,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +48: [2023-04-29 11:26:42,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +25: [2023-04-29 11:26:42,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +16: [2023-04-29 11:26:42,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +56: [2023-04-29 11:26:42,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +56: [2023-04-29 11:26:42,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +25: [2023-04-29 11:26:42,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +13: [2023-04-29 11:26:42,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +13: [2023-04-29 11:26:42,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 4: [2023-04-29 11:26:42,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +25: [2023-04-29 11:26:42,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +40: [2023-04-29 11:26:42,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +23: [2023-04-29 11:26:42,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 4: [2023-04-29 11:26:42,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +61: [2023-04-29 11:26:42,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +39: [2023-04-29 11:26:42,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +42: [2023-04-29 11:26:42,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +16: [2023-04-29 11:26:42,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 11:26:42,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 5: [2023-04-29 11:26:42,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +23: [2023-04-29 11:26:42,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 5: [2023-04-29 11:26:42,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 5: [2023-04-29 11:26:42,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 4: [2023-04-29 11:26:42,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 4: [2023-04-29 11:26:42,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +14: [2023-04-29 11:26:42,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +14: [2023-04-29 11:26:42,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +14: [2023-04-29 11:26:42,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +16: [2023-04-29 11:26:42,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +62: [2023-04-29 11:26:42,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +62: [2023-04-29 11:26:42,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +62: [2023-04-29 11:26:42,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +14: [2023-04-29 11:26:42,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +20: [2023-04-29 11:26:42,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +62: [2023-04-29 11:26:42,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 11:26:42,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +16: [2023-04-29 11:26:42,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +57: [2023-04-29 11:26:42,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +57: [2023-04-29 11:26:42,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +12: [2023-04-29 11:26:42,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +12: [2023-04-29 11:26:42,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +40: [2023-04-29 11:26:42,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +46: [2023-04-29 11:26:42,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 11:26:42,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +54: [2023-04-29 11:26:42,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +42: [2023-04-29 11:26:42,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 9: [2023-04-29 11:26:42,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +44: [2023-04-29 11:26:42,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +35: [2023-04-29 11:26:42,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +58: [2023-04-29 11:26:42,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +44: [2023-04-29 11:26:42,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +17: [2023-04-29 11:26:42,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +17: [2023-04-29 11:26:42,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +54: [2023-04-29 11:26:42,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +48: [2023-04-29 11:26:42,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +62: [2023-04-29 11:26:42,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +44: [2023-04-29 11:26:42,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +62: [2023-04-29 11:26:42,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +20: [2023-04-29 11:26:42,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +62: [2023-04-29 11:26:42,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +35: [2023-04-29 11:26:42,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +58: [2023-04-29 11:26:42,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +62: [2023-04-29 11:26:42,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +12: [2023-04-29 11:26:42,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +12: [2023-04-29 11:26:42,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +48: [2023-04-29 11:26:42,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 11:26:42,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 9: [2023-04-29 11:26:42,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 11:26:42,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +17: [2023-04-29 11:26:42,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +61: [2023-04-29 11:26:42,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +44: [2023-04-29 11:26:42,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +61: [2023-04-29 11:26:42,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +61: [2023-04-29 11:26:42,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +57: [2023-04-29 11:26:42,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +44: [2023-04-29 11:26:42,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... + 9: [2023-04-29 11:26:42,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 9: [2023-04-29 11:26:42,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +56: [2023-04-29 11:26:42,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +44: [2023-04-29 11:26:42,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +29: [2023-04-29 11:26:42,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 1: [2023-04-29 11:26:42,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +40: [2023-04-29 11:26:42,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +40: [2023-04-29 11:26:42,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +40: [2023-04-29 11:26:42,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 1: [2023-04-29 11:26:42,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +21: [2023-04-29 11:26:42,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +44: [2023-04-29 11:26:42,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +44: [2023-04-29 11:26:42,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +44: [2023-04-29 11:26:42,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 1: [2023-04-29 11:26:42,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +49: [2023-04-29 11:26:42,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +49: [2023-04-29 11:26:42,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +55: [2023-04-29 11:26:42,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +49: [2023-04-29 11:26:42,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +49: [2023-04-29 11:26:42,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_26-model_01-model_states.pt. +21: [2023-04-29 11:26:42,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +21: [2023-04-29 11:26:42,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +11: [2023-04-29 11:26:42,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +29: [2023-04-29 11:26:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +29: [2023-04-29 11:26:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +42: [2023-04-29 11:26:42,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +29: [2023-04-29 11:26:42,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +21: [2023-04-29 11:26:42,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +40: [2023-04-29 11:26:42,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +40: [2023-04-29 11:26:42,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +40: [2023-04-29 11:26:42,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +13: [2023-04-29 11:26:42,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +16: [2023-04-29 11:26:42,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +29: [2023-04-29 11:26:42,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +44: [2023-04-29 11:26:42,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +39: [2023-04-29 11:26:42,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +16: [2023-04-29 11:26:42,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +44: [2023-04-29 11:26:42,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +16: [2023-04-29 11:26:42,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +42: [2023-04-29 11:26:42,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +55: [2023-04-29 11:26:42,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +42: [2023-04-29 11:26:42,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +35: [2023-04-29 11:26:42,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +13: [2023-04-29 11:26:42,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +13: [2023-04-29 11:26:42,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +16: [2023-04-29 11:26:42,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +39: [2023-04-29 11:26:42,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 2: [2023-04-29 11:26:42,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +29: [2023-04-29 11:26:42,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +42: [2023-04-29 11:26:42,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 5: [2023-04-29 11:26:42,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +14: [2023-04-29 11:26:42,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +14: [2023-04-29 11:26:42,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +39: [2023-04-29 11:26:42,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +29: [2023-04-29 11:26:42,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +14: [2023-04-29 11:26:42,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +13: [2023-04-29 11:26:42,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +35: [2023-04-29 11:26:42,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +42: [2023-04-29 11:26:42,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +11: [2023-04-29 11:26:42,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +29: [2023-04-29 11:26:42,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +42: [2023-04-29 11:26:42,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... + 2: [2023-04-29 11:26:42,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 2: [2023-04-29 11:26:42,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 2: [2023-04-29 11:26:42,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +42: [2023-04-29 11:26:42,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +42: [2023-04-29 11:26:42,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... + 9: [2023-04-29 11:26:42,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 5: [2023-04-29 11:26:42,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +55: [2023-04-29 11:26:42,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +12: [2023-04-29 11:26:42,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +12: [2023-04-29 11:26:42,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +54: [2023-04-29 11:26:42,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +16: [2023-04-29 11:26:42,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +54: [2023-04-29 11:26:42,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +11: [2023-04-29 11:26:42,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +11: [2023-04-29 11:26:42,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +42: [2023-04-29 11:26:42,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +39: [2023-04-29 11:26:42,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +12: [2023-04-29 11:26:42,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +35: [2023-04-29 11:26:42,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +42: [2023-04-29 11:26:42,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 11:26:42,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 5: [2023-04-29 11:26:42,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 5: [2023-04-29 11:26:42,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +54: [2023-04-29 11:26:42,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +55: [2023-04-29 11:26:42,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +42: [2023-04-29 11:26:42,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +30: [2023-04-29 11:26:42,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +30: [2023-04-29 11:26:42,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +30: [2023-04-29 11:26:42,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 11:26:42,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +17: [2023-04-29 11:26:42,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +36: [2023-04-29 11:26:42,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +55: [2023-04-29 11:26:42,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +35: [2023-04-29 11:26:42,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +16: [2023-04-29 11:26:42,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 9: [2023-04-29 11:26:42,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +16: [2023-04-29 11:26:42,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +16: [2023-04-29 11:26:42,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +12: [2023-04-29 11:26:42,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +14: [2023-04-29 11:26:42,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +30: [2023-04-29 11:26:42,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 9: [2023-04-29 11:26:42,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +40: [2023-04-29 11:26:42,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +36: [2023-04-29 11:26:42,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +17: [2023-04-29 11:26:42,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +32: [2023-04-29 11:26:42,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +32: [2023-04-29 11:26:42,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +32: [2023-04-29 11:26:42,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 3: [2023-04-29 11:26:42,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +36: [2023-04-29 11:26:42,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +32: [2023-04-29 11:26:42,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 11:26:42,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 9: [2023-04-29 11:26:42,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +22: [2023-04-29 11:26:42,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +22: [2023-04-29 11:26:42,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +40: [2023-04-29 11:26:42,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +42: [2023-04-29 11:26:42,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +55: [2023-04-29 11:26:42,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +55: [2023-04-29 11:26:42,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +36: [2023-04-29 11:26:42,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +49: [2023-04-29 11:26:42,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 3: [2023-04-29 11:26:42,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +28: [2023-04-29 11:26:42,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +36: [2023-04-29 11:26:42,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +49: [2023-04-29 11:26:42,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +49: [2023-04-29 11:26:42,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... + 8: [2023-04-29 11:26:42,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 8: [2023-04-29 11:26:42,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 8: [2023-04-29 11:26:42,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +36: [2023-04-29 11:26:42,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 8: [2023-04-29 11:26:42,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +22: [2023-04-29 11:26:42,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +22: [2023-04-29 11:26:42,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 4: [2023-04-29 11:26:42,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +49: [2023-04-29 11:26:42,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +32: [2023-04-29 11:26:42,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 11:26:42,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +32: [2023-04-29 11:26:42,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +28: [2023-04-29 11:26:42,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +32: [2023-04-29 11:26:42,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 11:26:42,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +32: [2023-04-29 11:26:42,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +28: [2023-04-29 11:26:42,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +28: [2023-04-29 11:26:42,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +28: [2023-04-29 11:26:42,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +40: [2023-04-29 11:26:42,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 3: [2023-04-29 11:26:42,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 8: [2023-04-29 11:26:42,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 3: [2023-04-29 11:26:42,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 11:26:42,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +55: [2023-04-29 11:26:42,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +36: [2023-04-29 11:26:42,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... + 8: [2023-04-29 11:26:42,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 8: [2023-04-29 11:26:42,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +28: [2023-04-29 11:26:42,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 8: [2023-04-29 11:26:42,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +19: [2023-04-29 11:26:42,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +19: [2023-04-29 11:26:42,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +19: [2023-04-29 11:26:42,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +19: [2023-04-29 11:26:42,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +60: [2023-04-29 11:26:42,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +60: [2023-04-29 11:26:42,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +22: [2023-04-29 11:26:42,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +22: [2023-04-29 11:26:42,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +28: [2023-04-29 11:26:42,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +28: [2023-04-29 11:26:42,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +40: [2023-04-29 11:26:42,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +19: [2023-04-29 11:26:42,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +19: [2023-04-29 11:26:42,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +35: [2023-04-29 11:26:42,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +19: [2023-04-29 11:26:42,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +19: [2023-04-29 11:26:42,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +22: [2023-04-29 11:26:42,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 3: [2023-04-29 11:26:42,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +35: [2023-04-29 11:26:42,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +22: [2023-04-29 11:26:42,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +27: [2023-04-29 11:26:42,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +27: [2023-04-29 11:26:42,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +27: [2023-04-29 11:26:42,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +27: [2023-04-29 11:26:42,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +30: [2023-04-29 11:26:42,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +40: [2023-04-29 11:26:42,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +30: [2023-04-29 11:26:42,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 3: [2023-04-29 11:26:42,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 3: [2023-04-29 11:26:42,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +30: [2023-04-29 11:26:42,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 3: [2023-04-29 11:26:42,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. +40: [2023-04-29 11:26:42,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +30: [2023-04-29 11:26:42,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 7: [2023-04-29 11:26:42,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 3: [2023-04-29 11:26:42,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_04-model_01-model_states.pt. + 7: [2023-04-29 11:26:42,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 4: [2023-04-29 11:26:42,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +62: [2023-04-29 11:26:42,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 4: [2023-04-29 11:26:42,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 4: [2023-04-29 11:26:42,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 4: [2023-04-29 11:26:42,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 4: [2023-04-29 11:26:42,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +51: [2023-04-29 11:26:42,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +51: [2023-04-29 11:26:42,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. + 3: [2023-04-29 11:26:42,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 4: [2023-04-29 11:26:42,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +51: [2023-04-29 11:26:42,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +51: [2023-04-29 11:26:42,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. + 0: [2023-04-29 11:26:42,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +60: [2023-04-29 11:26:42,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +62: [2023-04-29 11:26:42,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +62: [2023-04-29 11:26:42,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +13: [2023-04-29 11:26:42,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +13: [2023-04-29 11:26:42,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +13: [2023-04-29 11:26:42,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 0: [2023-04-29 11:26:42,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +13: [2023-04-29 11:26:42,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 4: [2023-04-29 11:26:42,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +22: [2023-04-29 11:26:42,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +22: [2023-04-29 11:26:42,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +22: [2023-04-29 11:26:42,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 4: [2023-04-29 11:26:42,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 4: [2023-04-29 11:26:42,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +22: [2023-04-29 11:26:42,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +40: [2023-04-29 11:26:42,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 7: [2023-04-29 11:26:42,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +62: [2023-04-29 11:26:42,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +62: [2023-04-29 11:26:42,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +62: [2023-04-29 11:26:42,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +62: [2023-04-29 11:26:42,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. + 1: [2023-04-29 11:26:42,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +62: [2023-04-29 11:26:42,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +21: [2023-04-29 11:26:42,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 3: [2023-04-29 11:26:42,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 4: [2023-04-29 11:26:42,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +13: [2023-04-29 11:26:42,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +60: [2023-04-29 11:26:42,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +13: [2023-04-29 11:26:42,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 1: [2023-04-29 11:26:42,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +22: [2023-04-29 11:26:42,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +13: [2023-04-29 11:26:42,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +13: [2023-04-29 11:26:42,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +11: [2023-04-29 11:26:42,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +22: [2023-04-29 11:26:42,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +22: [2023-04-29 11:26:42,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 4: [2023-04-29 11:26:42,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +60: [2023-04-29 11:26:42,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +21: [2023-04-29 11:26:42,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +22: [2023-04-29 11:26:42,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 3: [2023-04-29 11:26:42,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 4: [2023-04-29 11:26:42,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +11: [2023-04-29 11:26:42,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 1: [2023-04-29 11:26:42,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 1: [2023-04-29 11:26:42,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +60: [2023-04-29 11:26:42,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +40: [2023-04-29 11:26:42,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +21: [2023-04-29 11:26:42,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +21: [2023-04-29 11:26:42,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +14: [2023-04-29 11:26:42,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +14: [2023-04-29 11:26:42,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +21: [2023-04-29 11:26:42,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +14: [2023-04-29 11:26:42,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 5: [2023-04-29 11:26:42,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 11:26:42,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +16: [2023-04-29 11:26:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +16: [2023-04-29 11:26:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +16: [2023-04-29 11:26:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 11:26:42,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +12: [2023-04-29 11:26:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +12: [2023-04-29 11:26:42,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 4: [2023-04-29 11:26:42,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +12: [2023-04-29 11:26:42,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +13: [2023-04-29 11:26:42,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +13: [2023-04-29 11:26:42,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 11:26:42,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +27: [2023-04-29 11:26:42,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +13: [2023-04-29 11:26:42,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +21: [2023-04-29 11:26:42,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +21: [2023-04-29 11:26:42,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +14: [2023-04-29 11:26:42,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +11: [2023-04-29 11:26:42,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +14: [2023-04-29 11:26:42,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +14: [2023-04-29 11:26:42,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 4: [2023-04-29 11:26:42,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 3: [2023-04-29 11:26:42,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... + 5: [2023-04-29 11:26:42,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +51: [2023-04-29 11:26:42,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +51: [2023-04-29 11:26:42,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +17: [2023-04-29 11:26:42,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 11:26:42,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 5: [2023-04-29 11:26:42,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +62: [2023-04-29 11:26:42,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +12: [2023-04-29 11:26:42,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +16: [2023-04-29 11:26:42,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +21: [2023-04-29 11:26:42,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +12: [2023-04-29 11:26:42,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +12: [2023-04-29 11:26:42,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 3: [2023-04-29 11:26:42,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +16: [2023-04-29 11:26:42,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +12: [2023-04-29 11:26:42,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 4: [2023-04-29 11:26:42,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +16: [2023-04-29 11:26:42,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +51: [2023-04-29 11:26:42,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +51: [2023-04-29 11:26:42,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 5: [2023-04-29 11:26:42,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 3: [2023-04-29 11:26:42,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +11: [2023-04-29 11:26:42,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 5: [2023-04-29 11:26:42,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +13: [2023-04-29 11:26:42,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +13: [2023-04-29 11:26:42,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +13: [2023-04-29 11:26:42,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +11: [2023-04-29 11:26:42,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +49: [2023-04-29 11:26:42,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 5: [2023-04-29 11:26:42,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +11: [2023-04-29 11:26:42,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +13: [2023-04-29 11:26:42,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 11:26:42,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 3: [2023-04-29 11:26:42,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt... +45: [2023-04-29 11:26:42,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +45: [2023-04-29 11:26:42,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +16: [2023-04-29 11:26:42,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +12: [2023-04-29 11:26:42,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +62: [2023-04-29 11:26:42,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +49: [2023-04-29 11:26:42,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +14: [2023-04-29 11:26:42,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +17: [2023-04-29 11:26:42,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +17: [2023-04-29 11:26:42,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +49: [2023-04-29 11:26:42,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +61: [2023-04-29 11:26:42,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +61: [2023-04-29 11:26:42,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. + 5: [2023-04-29 11:26:42,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +32: [2023-04-29 11:26:42,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +61: [2023-04-29 11:26:42,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +32: [2023-04-29 11:26:42,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +62: [2023-04-29 11:26:42,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +45: [2023-04-29 11:26:42,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +45: [2023-04-29 11:26:42,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +45: [2023-04-29 11:26:42,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +45: [2023-04-29 11:26:42,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +45: [2023-04-29 11:26:42,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +62: [2023-04-29 11:26:42,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +45: [2023-04-29 11:26:42,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +45: [2023-04-29 11:26:42,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +61: [2023-04-29 11:26:42,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +49: [2023-04-29 11:26:42,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +11: [2023-04-29 11:26:42,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +13: [2023-04-29 11:26:42,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 5: [2023-04-29 11:26:42,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +17: [2023-04-29 11:26:42,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +45: [2023-04-29 11:26:42,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +11: [2023-04-29 11:26:42,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +32: [2023-04-29 11:26:42,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +62: [2023-04-29 11:26:42,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +16: [2023-04-29 11:26:42,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +49: [2023-04-29 11:26:42,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +32: [2023-04-29 11:26:42,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +19: [2023-04-29 11:26:42,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 2: [2023-04-29 11:26:42,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 2: [2023-04-29 11:26:42,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 2: [2023-04-29 11:26:42,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 8: [2023-04-29 11:26:42,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +45: [2023-04-29 11:26:42,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +49: [2023-04-29 11:26:42,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +45: [2023-04-29 11:26:42,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +14: [2023-04-29 11:26:42,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +49: [2023-04-29 11:26:42,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +62: [2023-04-29 11:26:42,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +45: [2023-04-29 11:26:42,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +45: [2023-04-29 11:26:42,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt... +62: [2023-04-29 11:26:42,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +62: [2023-04-29 11:26:42,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +45: [2023-04-29 11:26:42,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +45: [2023-04-29 11:26:42,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +49: [2023-04-29 11:26:42,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt... +19: [2023-04-29 11:26:42,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +25: [2023-04-29 11:26:42,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +25: [2023-04-29 11:26:42,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 11:26:42,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +36: [2023-04-29 11:26:42,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 11:26:42,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +19: [2023-04-29 11:26:42,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +25: [2023-04-29 11:26:42,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +25: [2023-04-29 11:26:42,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +36: [2023-04-29 11:26:42,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 11:26:42,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +19: [2023-04-29 11:26:42,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +25: [2023-04-29 11:26:42,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +25: [2023-04-29 11:26:42,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 8: [2023-04-29 11:26:42,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 8: [2023-04-29 11:26:42,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 8: [2023-04-29 11:26:42,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +25: [2023-04-29 11:26:42,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +25: [2023-04-29 11:26:42,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 2: [2023-04-29 11:26:42,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +36: [2023-04-29 11:26:42,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +36: [2023-04-29 11:26:42,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +36: [2023-04-29 11:26:42,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +36: [2023-04-29 11:26:42,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 7: [2023-04-29 11:26:42,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 11:26:42,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +32: [2023-04-29 11:26:42,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +43: [2023-04-29 11:26:42,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +43: [2023-04-29 11:26:42,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +61: [2023-04-29 11:26:42,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +61: [2023-04-29 11:26:42,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +61: [2023-04-29 11:26:42,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +61: [2023-04-29 11:26:42,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +19: [2023-04-29 11:26:42,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +43: [2023-04-29 11:26:42,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +43: [2023-04-29 11:26:42,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +13: [2023-04-29 11:26:42,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +22: [2023-04-29 11:26:42,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +43: [2023-04-29 11:26:42,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +32: [2023-04-29 11:26:42,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +32: [2023-04-29 11:26:42,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +32: [2023-04-29 11:26:42,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +32: [2023-04-29 11:26:42,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +32: [2023-04-29 11:26:42,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +43: [2023-04-29 11:26:42,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 8: [2023-04-29 11:26:42,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 7: [2023-04-29 11:26:42,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +32: [2023-04-29 11:26:42,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 0: [2023-04-29 11:26:42,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +43: [2023-04-29 11:26:42,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +43: [2023-04-29 11:26:42,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 0: [2023-04-29 11:26:42,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +19: [2023-04-29 11:26:42,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +32: [2023-04-29 11:26:42,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +22: [2023-04-29 11:26:42,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +22: [2023-04-29 11:26:42,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +27: [2023-04-29 11:26:42,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +27: [2023-04-29 11:26:42,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +27: [2023-04-29 11:26:42,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +19: [2023-04-29 11:26:42,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +27: [2023-04-29 11:26:42,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +13: [2023-04-29 11:26:42,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +22: [2023-04-29 11:26:42,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +13: [2023-04-29 11:26:42,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +13: [2023-04-29 11:26:42,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +19: [2023-04-29 11:26:42,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 5: [2023-04-29 11:26:42,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 11:26:42,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 11:26:42,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 11:26:42,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 3: [2023-04-29 11:26:42,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 11:26:42,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +27: [2023-04-29 11:26:42,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +27: [2023-04-29 11:26:42,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +27: [2023-04-29 11:26:42,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 8: [2023-04-29 11:26:42,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +27: [2023-04-29 11:26:42,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 11:26:42,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 8: [2023-04-29 11:26:42,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 5: [2023-04-29 11:26:42,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 8: [2023-04-29 11:26:42,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +45: [2023-04-29 11:26:42,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 5: [2023-04-29 11:26:42,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 3: [2023-04-29 11:26:42,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 3: [2023-04-29 11:26:42,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 5: [2023-04-29 11:26:42,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 5: [2023-04-29 11:26:42,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +27: [2023-04-29 11:26:42,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 11:26:42,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +22: [2023-04-29 11:26:42,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +51: [2023-04-29 11:26:42,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +13: [2023-04-29 11:26:42,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 3: [2023-04-29 11:26:42,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. + 3: [2023-04-29 11:26:42,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_00-model_states.pt. +27: [2023-04-29 11:26:42,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +27: [2023-04-29 11:26:42,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 3: [2023-04-29 11:26:42,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 0: [2023-04-29 11:26:42,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +51: [2023-04-29 11:26:42,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +51: [2023-04-29 11:26:42,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +51: [2023-04-29 11:26:42,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +27: [2023-04-29 11:26:42,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +27: [2023-04-29 11:26:42,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 0: [2023-04-29 11:26:42,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 3: [2023-04-29 11:26:42,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... +62: [2023-04-29 11:26:42,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 3: [2023-04-29 11:26:42,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt... + 2: [2023-04-29 11:26:42,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +62: [2023-04-29 11:26:42,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +45: [2023-04-29 11:26:42,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +45: [2023-04-29 11:26:42,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +51: [2023-04-29 11:26:42,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +51: [2023-04-29 11:26:42,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... + 7: [2023-04-29 11:26:42,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +51: [2023-04-29 11:26:42,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +51: [2023-04-29 11:26:42,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +62: [2023-04-29 11:26:42,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +45: [2023-04-29 11:26:42,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_00-model_states.pt. +62: [2023-04-29 11:26:42,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +22: [2023-04-29 11:26:42,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +13: [2023-04-29 11:26:42,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +26: [2023-04-29 11:26:42,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +26: [2023-04-29 11:26:42,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +13: [2023-04-29 11:26:42,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +22: [2023-04-29 11:26:42,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +32: [2023-04-29 11:26:42,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +32: [2023-04-29 11:26:42,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +32: [2023-04-29 11:26:42,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +32: [2023-04-29 11:26:42,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +13: [2023-04-29 11:26:42,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 7: [2023-04-29 11:26:42,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +53: [2023-04-29 11:26:42,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +53: [2023-04-29 11:26:42,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +53: [2023-04-29 11:26:42,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +18: [2023-04-29 11:26:42,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +18: [2023-04-29 11:26:42,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +31: [2023-04-29 11:26:42,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +31: [2023-04-29 11:26:42,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +60: [2023-04-29 11:26:42,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +62: [2023-04-29 11:26:42,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +62: [2023-04-29 11:26:42,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +26: [2023-04-29 11:26:42,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +60: [2023-04-29 11:26:42,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +60: [2023-04-29 11:26:42,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +26: [2023-04-29 11:26:42,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +60: [2023-04-29 11:26:42,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +53: [2023-04-29 11:26:42,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +31: [2023-04-29 11:26:42,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +31: [2023-04-29 11:26:42,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +18: [2023-04-29 11:26:42,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +45: [2023-04-29 11:26:42,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +18: [2023-04-29 11:26:42,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +22: [2023-04-29 11:26:42,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +26: [2023-04-29 11:26:42,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +26: [2023-04-29 11:26:42,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +15: [2023-04-29 11:26:42,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +15: [2023-04-29 11:26:42,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +15: [2023-04-29 11:26:42,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +15: [2023-04-29 11:26:42,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +26: [2023-04-29 11:26:42,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +26: [2023-04-29 11:26:42,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +62: [2023-04-29 11:26:42,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +62: [2023-04-29 11:26:42,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +18: [2023-04-29 11:26:42,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +18: [2023-04-29 11:26:42,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +31: [2023-04-29 11:26:42,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +31: [2023-04-29 11:26:42,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +36: [2023-04-29 11:26:42,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +31: [2023-04-29 11:26:42,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +18: [2023-04-29 11:26:42,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +25: [2023-04-29 11:26:42,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +18: [2023-04-29 11:26:42,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +31: [2023-04-29 11:26:42,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 2: [2023-04-29 11:26:42,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +25: [2023-04-29 11:26:42,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +25: [2023-04-29 11:26:42,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +15: [2023-04-29 11:26:42,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +15: [2023-04-29 11:26:42,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +15: [2023-04-29 11:26:42,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +15: [2023-04-29 11:26:42,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +25: [2023-04-29 11:26:42,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 2: [2023-04-29 11:26:42,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +61: [2023-04-29 11:26:42,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 11:26:42,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 11:26:42,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 11:26:42,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +32: [2023-04-29 11:26:42,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +10: [2023-04-29 11:26:42,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +10: [2023-04-29 11:26:42,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +10: [2023-04-29 11:26:42,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +10: [2023-04-29 11:26:42,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +43: [2023-04-29 11:26:42,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +43: [2023-04-29 11:26:42,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +61: [2023-04-29 11:26:42,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +61: [2023-04-29 11:26:42,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +45: [2023-04-29 11:26:42,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +61: [2023-04-29 11:26:42,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +61: [2023-04-29 11:26:42,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +45: [2023-04-29 11:26:42,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +32: [2023-04-29 11:26:42,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +10: [2023-04-29 11:26:42,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +10: [2023-04-29 11:26:42,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +53: [2023-04-29 11:26:42,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +45: [2023-04-29 11:26:42,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 7: [2023-04-29 11:26:42,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +10: [2023-04-29 11:26:42,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +53: [2023-04-29 11:26:42,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +61: [2023-04-29 11:26:42,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +61: [2023-04-29 11:26:42,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +61: [2023-04-29 11:26:42,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +43: [2023-04-29 11:26:42,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +10: [2023-04-29 11:26:42,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +43: [2023-04-29 11:26:42,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +53: [2023-04-29 11:26:42,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +53: [2023-04-29 11:26:42,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +36: [2023-04-29 11:26:42,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +60: [2023-04-29 11:26:42,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 11:26:42,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 11:26:42,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 11:26:42,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +33: [2023-04-29 11:26:42,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +33: [2023-04-29 11:26:42,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +33: [2023-04-29 11:26:42,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +33: [2023-04-29 11:26:42,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +25: [2023-04-29 11:26:42,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 9: [2023-04-29 11:26:42,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 9: [2023-04-29 11:26:42,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 9: [2023-04-29 11:26:42,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 2: [2023-04-29 11:26:42,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 9: [2023-04-29 11:26:42,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +25: [2023-04-29 11:26:42,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +25: [2023-04-29 11:26:42,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +27: [2023-04-29 11:26:42,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 11:26:42,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 11:26:42,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +25: [2023-04-29 11:26:42,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 2: [2023-04-29 11:26:42,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +63: [2023-04-29 11:26:42,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +63: [2023-04-29 11:26:42,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 2: [2023-04-29 11:26:42,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +27: [2023-04-29 11:26:42,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +27: [2023-04-29 11:26:42,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +27: [2023-04-29 11:26:42,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +36: [2023-04-29 11:26:42,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +36: [2023-04-29 11:26:42,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +36: [2023-04-29 11:26:42,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +63: [2023-04-29 11:26:42,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +63: [2023-04-29 11:26:42,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +43: [2023-04-29 11:26:42,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +32: [2023-04-29 11:26:42,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +32: [2023-04-29 11:26:42,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +34: [2023-04-29 11:26:42,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +34: [2023-04-29 11:26:42,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 5: [2023-04-29 11:26:42,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 11:26:42,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +43: [2023-04-29 11:26:42,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 11:26:42,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +51: [2023-04-29 11:26:42,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 6: [2023-04-29 11:26:42,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 6: [2023-04-29 11:26:42,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 6: [2023-04-29 11:26:42,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +63: [2023-04-29 11:26:42,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +63: [2023-04-29 11:26:42,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +63: [2023-04-29 11:26:42,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +63: [2023-04-29 11:26:42,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +51: [2023-04-29 11:26:42,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +34: [2023-04-29 11:26:42,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +34: [2023-04-29 11:26:42,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +51: [2023-04-29 11:26:42,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 11:26:42,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +32: [2023-04-29 11:26:42,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +32: [2023-04-29 11:26:42,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +43: [2023-04-29 11:26:42,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +43: [2023-04-29 11:26:42,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 11:26:42,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +34: [2023-04-29 11:26:42,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +34: [2023-04-29 11:26:42,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +51: [2023-04-29 11:26:42,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 11:26:42,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +34: [2023-04-29 11:26:42,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +51: [2023-04-29 11:26:42,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 9: [2023-04-29 11:26:42,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +33: [2023-04-29 11:26:42,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +32: [2023-04-29 11:26:42,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +34: [2023-04-29 11:26:42,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +33: [2023-04-29 11:26:42,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 9: [2023-04-29 11:26:42,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +33: [2023-04-29 11:26:42,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +33: [2023-04-29 11:26:42,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 9: [2023-04-29 11:26:42,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +18: [2023-04-29 11:26:42,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 11:26:42,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 5: [2023-04-29 11:26:42,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +31: [2023-04-29 11:26:42,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +27: [2023-04-29 11:26:42,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 9: [2023-04-29 11:26:42,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +38: [2023-04-29 11:26:42,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +38: [2023-04-29 11:26:42,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +26: [2023-04-29 11:26:42,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +18: [2023-04-29 11:26:42,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +18: [2023-04-29 11:26:42,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +27: [2023-04-29 11:26:42,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +18: [2023-04-29 11:26:42,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +26: [2023-04-29 11:26:42,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +26: [2023-04-29 11:26:42,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +26: [2023-04-29 11:26:42,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +27: [2023-04-29 11:26:42,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +38: [2023-04-29 11:26:42,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +38: [2023-04-29 11:26:42,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +15: [2023-04-29 11:26:42,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +15: [2023-04-29 11:26:42,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +11: [2023-04-29 11:26:42,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +11: [2023-04-29 11:26:42,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +11: [2023-04-29 11:26:42,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +38: [2023-04-29 11:26:42,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +11: [2023-04-29 11:26:42,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +38: [2023-04-29 11:26:42,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +27: [2023-04-29 11:26:42,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +31: [2023-04-29 11:26:42,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +31: [2023-04-29 11:26:42,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +31: [2023-04-29 11:26:42,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +15: [2023-04-29 11:26:42,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +15: [2023-04-29 11:26:42,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +38: [2023-04-29 11:26:42,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +38: [2023-04-29 11:26:42,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +11: [2023-04-29 11:26:42,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +41: [2023-04-29 11:26:42,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +41: [2023-04-29 11:26:42,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +41: [2023-04-29 11:26:42,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +41: [2023-04-29 11:26:42,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +11: [2023-04-29 11:26:42,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 5: [2023-04-29 11:26:42,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +11: [2023-04-29 11:26:42,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 5: [2023-04-29 11:26:42,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +11: [2023-04-29 11:26:42,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +21: [2023-04-29 11:26:42,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +21: [2023-04-29 11:26:42,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +21: [2023-04-29 11:26:42,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +21: [2023-04-29 11:26:42,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +54: [2023-04-29 11:26:42,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +54: [2023-04-29 11:26:42,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +54: [2023-04-29 11:26:42,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +12: [2023-04-29 11:26:42,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +12: [2023-04-29 11:26:42,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +54: [2023-04-29 11:26:42,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +12: [2023-04-29 11:26:42,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +12: [2023-04-29 11:26:42,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +21: [2023-04-29 11:26:42,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +21: [2023-04-29 11:26:42,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +21: [2023-04-29 11:26:42,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +21: [2023-04-29 11:26:42,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +10: [2023-04-29 11:26:42,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +29: [2023-04-29 11:26:42,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +29: [2023-04-29 11:26:42,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +29: [2023-04-29 11:26:42,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +12: [2023-04-29 11:26:42,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +12: [2023-04-29 11:26:42,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +12: [2023-04-29 11:26:42,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +10: [2023-04-29 11:26:42,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +29: [2023-04-29 11:26:42,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +53: [2023-04-29 11:26:42,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +12: [2023-04-29 11:26:42,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 1: [2023-04-29 11:26:42,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 1: [2023-04-29 11:26:42,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +31: [2023-04-29 11:26:42,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +29: [2023-04-29 11:26:42,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +33: [2023-04-29 11:26:42,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +33: [2023-04-29 11:26:42,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +33: [2023-04-29 11:26:42,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +33: [2023-04-29 11:26:42,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +18: [2023-04-29 11:26:42,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +29: [2023-04-29 11:26:42,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +53: [2023-04-29 11:26:42,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +29: [2023-04-29 11:26:42,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +60: [2023-04-29 11:26:42,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +29: [2023-04-29 11:26:42,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +39: [2023-04-29 11:26:42,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +39: [2023-04-29 11:26:42,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +60: [2023-04-29 11:26:42,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +39: [2023-04-29 11:26:42,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +39: [2023-04-29 11:26:42,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +26: [2023-04-29 11:26:42,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +17: [2023-04-29 11:26:42,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 11:26:42,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 11:26:42,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +33: [2023-04-29 11:26:42,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +53: [2023-04-29 11:26:42,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +17: [2023-04-29 11:26:42,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 1: [2023-04-29 11:26:42,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +18: [2023-04-29 11:26:42,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +53: [2023-04-29 11:26:42,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +33: [2023-04-29 11:26:42,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +10: [2023-04-29 11:26:42,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +23: [2023-04-29 11:26:42,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +23: [2023-04-29 11:26:42,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +60: [2023-04-29 11:26:42,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +60: [2023-04-29 11:26:42,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +37: [2023-04-29 11:26:42,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +37: [2023-04-29 11:26:42,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +33: [2023-04-29 11:26:42,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +33: [2023-04-29 11:26:42,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +37: [2023-04-29 11:26:42,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +18: [2023-04-29 11:26:42,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +53: [2023-04-29 11:26:42,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +53: [2023-04-29 11:26:42,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +37: [2023-04-29 11:26:42,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +60: [2023-04-29 11:26:42,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +60: [2023-04-29 11:26:42,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +39: [2023-04-29 11:26:42,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +10: [2023-04-29 11:26:42,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +39: [2023-04-29 11:26:42,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +39: [2023-04-29 11:26:42,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +26: [2023-04-29 11:26:42,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +26: [2023-04-29 11:26:42,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +26: [2023-04-29 11:26:42,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +15: [2023-04-29 11:26:42,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +15: [2023-04-29 11:26:42,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +39: [2023-04-29 11:26:42,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +31: [2023-04-29 11:26:42,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +23: [2023-04-29 11:26:42,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +23: [2023-04-29 11:26:42,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +18: [2023-04-29 11:26:42,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +17: [2023-04-29 11:26:42,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +17: [2023-04-29 11:26:42,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +31: [2023-04-29 11:26:42,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +60: [2023-04-29 11:26:42,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +31: [2023-04-29 11:26:42,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +37: [2023-04-29 11:26:42,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +17: [2023-04-29 11:26:42,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +15: [2023-04-29 11:26:42,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +15: [2023-04-29 11:26:42,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +37: [2023-04-29 11:26:42,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +37: [2023-04-29 11:26:42,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +37: [2023-04-29 11:26:42,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 11:26:42,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +23: [2023-04-29 11:26:42,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +17: [2023-04-29 11:26:42,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +53: [2023-04-29 11:26:42,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +53: [2023-04-29 11:26:42,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +23: [2023-04-29 11:26:42,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +41: [2023-04-29 11:26:42,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +41: [2023-04-29 11:26:42,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +23: [2023-04-29 11:26:42,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +41: [2023-04-29 11:26:42,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +41: [2023-04-29 11:26:42,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +23: [2023-04-29 11:26:42,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +54: [2023-04-29 11:26:42,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 11:26:42,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +55: [2023-04-29 11:26:42,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +55: [2023-04-29 11:26:42,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +54: [2023-04-29 11:26:42,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +10: [2023-04-29 11:26:42,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +54: [2023-04-29 11:26:42,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +63: [2023-04-29 11:26:42,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +53: [2023-04-29 11:26:42,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +53: [2023-04-29 11:26:42,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +53: [2023-04-29 11:26:42,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +55: [2023-04-29 11:26:42,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +53: [2023-04-29 11:26:42,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +10: [2023-04-29 11:26:42,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 11:26:42,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +24: [2023-04-29 11:26:42,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +24: [2023-04-29 11:26:42,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 6: [2023-04-29 11:26:42,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +24: [2023-04-29 11:26:42,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +24: [2023-04-29 11:26:42,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +55: [2023-04-29 11:26:42,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +55: [2023-04-29 11:26:42,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +53: [2023-04-29 11:26:42,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +53: [2023-04-29 11:26:42,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +55: [2023-04-29 11:26:42,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 9: [2023-04-29 11:26:42,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +34: [2023-04-29 11:26:42,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +63: [2023-04-29 11:26:42,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +63: [2023-04-29 11:26:42,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +55: [2023-04-29 11:26:42,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +53: [2023-04-29 11:26:42,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +53: [2023-04-29 11:26:42,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +24: [2023-04-29 11:26:42,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +24: [2023-04-29 11:26:42,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +51: [2023-04-29 11:26:42,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +24: [2023-04-29 11:26:42,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +24: [2023-04-29 11:26:42,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +63: [2023-04-29 11:26:42,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 9: [2023-04-29 11:26:42,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 9: [2023-04-29 11:26:42,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +51: [2023-04-29 11:26:42,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +51: [2023-04-29 11:26:42,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +14: [2023-04-29 11:26:42,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +14: [2023-04-29 11:26:42,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +14: [2023-04-29 11:26:42,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +14: [2023-04-29 11:26:42,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +10: [2023-04-29 11:26:42,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +34: [2023-04-29 11:26:42,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +34: [2023-04-29 11:26:42,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +50: [2023-04-29 11:26:42,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +50: [2023-04-29 11:26:42,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +50: [2023-04-29 11:26:42,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +50: [2023-04-29 11:26:42,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 9: [2023-04-29 11:26:42,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 9: [2023-04-29 11:26:42,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +34: [2023-04-29 11:26:42,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +20: [2023-04-29 11:26:42,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +20: [2023-04-29 11:26:42,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +51: [2023-04-29 11:26:42,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +20: [2023-04-29 11:26:42,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +47: [2023-04-29 11:26:42,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +47: [2023-04-29 11:26:42,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +20: [2023-04-29 11:26:42,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +10: [2023-04-29 11:26:42,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 9: [2023-04-29 11:26:42,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +47: [2023-04-29 11:26:42,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +47: [2023-04-29 11:26:42,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +14: [2023-04-29 11:26:42,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 9: [2023-04-29 11:26:42,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +14: [2023-04-29 11:26:42,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +14: [2023-04-29 11:26:42,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +14: [2023-04-29 11:26:42,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +43: [2023-04-29 11:26:42,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +43: [2023-04-29 11:26:42,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +20: [2023-04-29 11:26:42,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +20: [2023-04-29 11:26:42,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +43: [2023-04-29 11:26:42,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +20: [2023-04-29 11:26:42,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +43: [2023-04-29 11:26:42,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +20: [2023-04-29 11:26:42,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 9: [2023-04-29 11:26:42,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +11: [2023-04-29 11:26:42,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +47: [2023-04-29 11:26:42,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +33: [2023-04-29 11:26:42,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +33: [2023-04-29 11:26:42,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +33: [2023-04-29 11:26:42,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +33: [2023-04-29 11:26:42,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +50: [2023-04-29 11:26:42,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +47: [2023-04-29 11:26:42,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 6: [2023-04-29 11:26:42,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 6: [2023-04-29 11:26:42,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +50: [2023-04-29 11:26:42,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +47: [2023-04-29 11:26:42,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +50: [2023-04-29 11:26:42,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +38: [2023-04-29 11:26:42,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +38: [2023-04-29 11:26:42,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +63: [2023-04-29 11:26:42,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +50: [2023-04-29 11:26:42,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +34: [2023-04-29 11:26:42,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +24: [2023-04-29 11:26:42,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +24: [2023-04-29 11:26:42,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +24: [2023-04-29 11:26:42,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +24: [2023-04-29 11:26:42,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +21: [2023-04-29 11:26:42,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 8: [2023-04-29 11:26:42,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 8: [2023-04-29 11:26:42,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 8: [2023-04-29 11:26:42,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 8: [2023-04-29 11:26:42,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +47: [2023-04-29 11:26:42,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +38: [2023-04-29 11:26:42,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +31: [2023-04-29 11:26:42,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +31: [2023-04-29 11:26:42,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +31: [2023-04-29 11:26:42,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 6: [2023-04-29 11:26:42,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +29: [2023-04-29 11:26:42,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +31: [2023-04-29 11:26:42,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +33: [2023-04-29 11:26:42,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +33: [2023-04-29 11:26:42,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +33: [2023-04-29 11:26:42,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +33: [2023-04-29 11:26:42,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... + 6: [2023-04-29 11:26:42,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +38: [2023-04-29 11:26:42,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +11: [2023-04-29 11:26:42,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +11: [2023-04-29 11:26:42,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +11: [2023-04-29 11:26:42,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +21: [2023-04-29 11:26:42,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +12: [2023-04-29 11:26:42,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +51: [2023-04-29 11:26:42,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +52: [2023-04-29 11:26:42,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +52: [2023-04-29 11:26:42,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +63: [2023-04-29 11:26:42,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +63: [2023-04-29 11:26:42,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +12: [2023-04-29 11:26:42,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +12: [2023-04-29 11:26:42,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +63: [2023-04-29 11:26:42,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +29: [2023-04-29 11:26:42,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +12: [2023-04-29 11:26:42,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +52: [2023-04-29 11:26:42,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +29: [2023-04-29 11:26:42,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +52: [2023-04-29 11:26:42,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +39: [2023-04-29 11:26:42,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +34: [2023-04-29 11:26:42,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +34: [2023-04-29 11:26:42,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 11:26:42,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +51: [2023-04-29 11:26:42,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +34: [2023-04-29 11:26:42,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +34: [2023-04-29 11:26:42,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +21: [2023-04-29 11:26:42,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +21: [2023-04-29 11:26:42,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +51: [2023-04-29 11:26:42,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +37: [2023-04-29 11:26:42,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +11: [2023-04-29 11:26:42,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +34: [2023-04-29 11:26:42,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +61: [2023-04-29 11:26:42,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +61: [2023-04-29 11:26:42,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +34: [2023-04-29 11:26:42,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +34: [2023-04-29 11:26:42,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +33: [2023-04-29 11:26:42,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +24: [2023-04-29 11:26:42,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +61: [2023-04-29 11:26:42,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +61: [2023-04-29 11:26:42,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +17: [2023-04-29 11:26:42,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +39: [2023-04-29 11:26:42,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +39: [2023-04-29 11:26:42,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +29: [2023-04-29 11:26:42,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 1: [2023-04-29 11:26:42,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 1: [2023-04-29 11:26:42,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 1: [2023-04-29 11:26:42,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +43: [2023-04-29 11:26:42,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +43: [2023-04-29 11:26:42,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +43: [2023-04-29 11:26:42,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +43: [2023-04-29 11:26:42,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +21: [2023-04-29 11:26:42,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +37: [2023-04-29 11:26:42,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +17: [2023-04-29 11:26:42,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +38: [2023-04-29 11:26:42,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +38: [2023-04-29 11:26:42,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +33: [2023-04-29 11:26:42,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +61: [2023-04-29 11:26:42,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +61: [2023-04-29 11:26:42,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +61: [2023-04-29 11:26:42,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +61: [2023-04-29 11:26:42,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +39: [2023-04-29 11:26:42,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +29: [2023-04-29 11:26:42,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +53: [2023-04-29 11:26:42,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +31: [2023-04-29 11:26:42,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +23: [2023-04-29 11:26:42,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +54: [2023-04-29 11:26:42,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +54: [2023-04-29 11:26:42,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +31: [2023-04-29 11:26:42,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +24: [2023-04-29 11:26:42,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +31: [2023-04-29 11:26:42,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +37: [2023-04-29 11:26:42,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +37: [2023-04-29 11:26:42,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +31: [2023-04-29 11:26:42,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +23: [2023-04-29 11:26:42,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +23: [2023-04-29 11:26:42,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 8: [2023-04-29 11:26:42,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 8: [2023-04-29 11:26:42,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 8: [2023-04-29 11:26:42,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 8: [2023-04-29 11:26:42,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +33: [2023-04-29 11:26:42,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +54: [2023-04-29 11:26:42,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +24: [2023-04-29 11:26:42,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +24: [2023-04-29 11:26:42,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +17: [2023-04-29 11:26:42,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 11:26:42,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +38: [2023-04-29 11:26:42,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +54: [2023-04-29 11:26:42,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +38: [2023-04-29 11:26:42,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +54: [2023-04-29 11:26:42,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +21: [2023-04-29 11:26:42,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +33: [2023-04-29 11:26:42,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 0: [2023-04-29 11:26:42,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 0: [2023-04-29 11:26:42,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 0: [2023-04-29 11:26:42,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 7: [2023-04-29 11:26:42,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 7: [2023-04-29 11:26:42,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +54: [2023-04-29 11:26:42,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +12: [2023-04-29 11:26:42,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +54: [2023-04-29 11:26:42,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 7: [2023-04-29 11:26:42,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +54: [2023-04-29 11:26:42,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 7: [2023-04-29 11:26:42,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +52: [2023-04-29 11:26:42,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +23: [2023-04-29 11:26:42,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +54: [2023-04-29 11:26:42,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +54: [2023-04-29 11:26:42,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +52: [2023-04-29 11:26:42,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 1: [2023-04-29 11:26:42,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +11: [2023-04-29 11:26:42,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +52: [2023-04-29 11:26:42,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +54: [2023-04-29 11:26:42,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 11:26:42,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +52: [2023-04-29 11:26:42,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +55: [2023-04-29 11:26:42,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +52: [2023-04-29 11:26:42,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +11: [2023-04-29 11:26:42,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +12: [2023-04-29 11:26:42,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +12: [2023-04-29 11:26:42,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +11: [2023-04-29 11:26:42,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +52: [2023-04-29 11:26:42,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +53: [2023-04-29 11:26:42,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +12: [2023-04-29 11:26:42,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +29: [2023-04-29 11:26:42,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +29: [2023-04-29 11:26:42,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +28: [2023-04-29 11:26:42,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +28: [2023-04-29 11:26:42,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +28: [2023-04-29 11:26:42,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +28: [2023-04-29 11:26:42,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +52: [2023-04-29 11:26:42,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 11:26:42,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +54: [2023-04-29 11:26:42,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +52: [2023-04-29 11:26:42,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +33: [2023-04-29 11:26:42,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +21: [2023-04-29 11:26:42,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +54: [2023-04-29 11:26:42,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +21: [2023-04-29 11:26:42,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +52: [2023-04-29 11:26:42,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +52: [2023-04-29 11:26:42,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +53: [2023-04-29 11:26:42,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +53: [2023-04-29 11:26:42,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +52: [2023-04-29 11:26:42,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +37: [2023-04-29 11:26:42,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +34: [2023-04-29 11:26:42,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +34: [2023-04-29 11:26:42,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +17: [2023-04-29 11:26:42,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +39: [2023-04-29 11:26:42,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +24: [2023-04-29 11:26:42,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +24: [2023-04-29 11:26:42,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +28: [2023-04-29 11:26:42,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +28: [2023-04-29 11:26:42,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +28: [2023-04-29 11:26:42,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +28: [2023-04-29 11:26:42,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +55: [2023-04-29 11:26:42,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +34: [2023-04-29 11:26:42,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 11:26:42,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +54: [2023-04-29 11:26:42,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... + 1: [2023-04-29 11:26:42,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +34: [2023-04-29 11:26:42,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +55: [2023-04-29 11:26:42,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 1: [2023-04-29 11:26:42,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 1: [2023-04-29 11:26:42,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +29: [2023-04-29 11:26:42,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +39: [2023-04-29 11:26:42,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +39: [2023-04-29 11:26:42,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +37: [2023-04-29 11:26:42,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +17: [2023-04-29 11:26:42,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +20: [2023-04-29 11:26:42,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +20: [2023-04-29 11:26:42,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +53: [2023-04-29 11:26:42,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +23: [2023-04-29 11:26:42,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 11:26:42,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +33: [2023-04-29 11:26:42,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 11:26:42,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +23: [2023-04-29 11:26:42,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +41: [2023-04-29 11:26:42,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +41: [2023-04-29 11:26:42,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +33: [2023-04-29 11:26:42,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +23: [2023-04-29 11:26:42,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +20: [2023-04-29 11:26:42,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +41: [2023-04-29 11:26:42,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +37: [2023-04-29 11:26:42,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +41: [2023-04-29 11:26:42,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +41: [2023-04-29 11:26:42,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +41: [2023-04-29 11:26:42,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +41: [2023-04-29 11:26:42,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +37: [2023-04-29 11:26:42,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 0: [2023-04-29 11:26:42,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +17: [2023-04-29 11:26:42,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +41: [2023-04-29 11:26:42,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +39: [2023-04-29 11:26:42,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +49: [2023-04-29 11:26:42,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +49: [2023-04-29 11:26:42,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +55: [2023-04-29 11:26:42,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +20: [2023-04-29 11:26:42,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +14: [2023-04-29 11:26:42,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +49: [2023-04-29 11:26:42,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +49: [2023-04-29 11:26:42,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +33: [2023-04-29 11:26:42,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +14: [2023-04-29 11:26:42,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +14: [2023-04-29 11:26:42,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +14: [2023-04-29 11:26:42,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +17: [2023-04-29 11:26:42,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 0: [2023-04-29 11:26:42,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 0: [2023-04-29 11:26:42,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +41: [2023-04-29 11:26:42,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +41: [2023-04-29 11:26:42,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +41: [2023-04-29 11:26:42,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +41: [2023-04-29 11:26:42,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +41: [2023-04-29 11:26:42,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +41: [2023-04-29 11:26:42,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +47: [2023-04-29 11:26:42,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +47: [2023-04-29 11:26:42,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +41: [2023-04-29 11:26:42,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +23: [2023-04-29 11:26:42,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +35: [2023-04-29 11:26:42,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +35: [2023-04-29 11:26:42,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +35: [2023-04-29 11:26:42,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +59: [2023-04-29 11:26:42,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +59: [2023-04-29 11:26:42,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +50: [2023-04-29 11:26:42,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +50: [2023-04-29 11:26:42,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +50: [2023-04-29 11:26:42,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +59: [2023-04-29 11:26:42,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +41: [2023-04-29 11:26:42,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +35: [2023-04-29 11:26:42,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +56: [2023-04-29 11:26:42,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +56: [2023-04-29 11:26:42,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +59: [2023-04-29 11:26:42,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +53: [2023-04-29 11:26:42,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 7: [2023-04-29 11:26:42,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 7: [2023-04-29 11:26:42,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +24: [2023-04-29 11:26:42,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +24: [2023-04-29 11:26:42,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +24: [2023-04-29 11:26:42,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +24: [2023-04-29 11:26:42,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +49: [2023-04-29 11:26:42,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +47: [2023-04-29 11:26:42,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +15: [2023-04-29 11:26:42,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +15: [2023-04-29 11:26:42,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +15: [2023-04-29 11:26:42,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +15: [2023-04-29 11:26:42,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +49: [2023-04-29 11:26:42,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +49: [2023-04-29 11:26:42,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +50: [2023-04-29 11:26:42,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +53: [2023-04-29 11:26:42,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +55: [2023-04-29 11:26:42,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +53: [2023-04-29 11:26:42,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +56: [2023-04-29 11:26:42,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +56: [2023-04-29 11:26:42,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +56: [2023-04-29 11:26:42,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +56: [2023-04-29 11:26:42,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +42: [2023-04-29 11:26:42,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +42: [2023-04-29 11:26:42,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +42: [2023-04-29 11:26:42,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +60: [2023-04-29 11:26:42,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +60: [2023-04-29 11:26:42,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +49: [2023-04-29 11:26:42,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +42: [2023-04-29 11:26:42,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +62: [2023-04-29 11:26:42,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +62: [2023-04-29 11:26:42,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +20: [2023-04-29 11:26:42,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +20: [2023-04-29 11:26:42,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +20: [2023-04-29 11:26:42,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 7: [2023-04-29 11:26:42,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +62: [2023-04-29 11:26:42,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +20: [2023-04-29 11:26:42,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +59: [2023-04-29 11:26:42,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +59: [2023-04-29 11:26:42,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +62: [2023-04-29 11:26:42,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +59: [2023-04-29 11:26:42,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +59: [2023-04-29 11:26:42,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 11:26:42,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +56: [2023-04-29 11:26:42,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 11:26:42,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +56: [2023-04-29 11:26:42,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +47: [2023-04-29 11:26:42,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +55: [2023-04-29 11:26:42,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +62: [2023-04-29 11:26:42,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +42: [2023-04-29 11:26:42,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +62: [2023-04-29 11:26:42,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +60: [2023-04-29 11:26:42,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +60: [2023-04-29 11:26:42,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +62: [2023-04-29 11:26:42,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +20: [2023-04-29 11:26:42,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +59: [2023-04-29 11:26:42,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +59: [2023-04-29 11:26:42,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +20: [2023-04-29 11:26:42,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 11:26:42,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +60: [2023-04-29 11:26:42,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +62: [2023-04-29 11:26:42,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +42: [2023-04-29 11:26:42,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +42: [2023-04-29 11:26:42,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +42: [2023-04-29 11:26:42,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +50: [2023-04-29 11:26:42,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +50: [2023-04-29 11:26:42,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +24: [2023-04-29 11:26:42,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +50: [2023-04-29 11:26:42,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +60: [2023-04-29 11:26:42,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +59: [2023-04-29 11:26:42,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +59: [2023-04-29 11:26:42,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +50: [2023-04-29 11:26:42,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +54: [2023-04-29 11:26:42,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +31: [2023-04-29 11:26:42,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +43: [2023-04-29 11:26:42,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +24: [2023-04-29 11:26:42,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +58: [2023-04-29 11:26:42,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +58: [2023-04-29 11:26:42,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +58: [2023-04-29 11:26:42,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +58: [2023-04-29 11:26:42,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +44: [2023-04-29 11:26:42,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 11:26:42,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 11:26:42,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +19: [2023-04-29 11:26:42,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +19: [2023-04-29 11:26:42,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +44: [2023-04-29 11:26:42,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +19: [2023-04-29 11:26:42,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +20: [2023-04-29 11:26:42,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +19: [2023-04-29 11:26:42,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +61: [2023-04-29 11:26:42,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +61: [2023-04-29 11:26:42,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +46: [2023-04-29 11:26:42,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +46: [2023-04-29 11:26:42,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +43: [2023-04-29 11:26:42,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +20: [2023-04-29 11:26:42,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +31: [2023-04-29 11:26:42,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +14: [2023-04-29 11:26:42,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +43: [2023-04-29 11:26:42,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 11:26:42,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +15: [2023-04-29 11:26:42,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +44: [2023-04-29 11:26:42,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +43: [2023-04-29 11:26:42,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +14: [2023-04-29 11:26:42,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +35: [2023-04-29 11:26:42,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 8: [2023-04-29 11:26:42,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +61: [2023-04-29 11:26:42,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +61: [2023-04-29 11:26:42,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 11:26:42,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +14: [2023-04-29 11:26:42,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +31: [2023-04-29 11:26:42,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +31: [2023-04-29 11:26:42,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +31: [2023-04-29 11:26:42,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +44: [2023-04-29 11:26:42,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +46: [2023-04-29 11:26:42,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +28: [2023-04-29 11:26:42,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +15: [2023-04-29 11:26:42,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +46: [2023-04-29 11:26:42,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +15: [2023-04-29 11:26:42,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +44: [2023-04-29 11:26:42,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +35: [2023-04-29 11:26:42,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +14: [2023-04-29 11:26:42,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +24: [2023-04-29 11:26:42,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +24: [2023-04-29 11:26:42,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +46: [2023-04-29 11:26:42,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +46: [2023-04-29 11:26:42,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +43: [2023-04-29 11:26:42,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +15: [2023-04-29 11:26:42,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +54: [2023-04-29 11:26:42,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +47: [2023-04-29 11:26:42,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +47: [2023-04-29 11:26:42,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. + 8: [2023-04-29 11:26:42,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +47: [2023-04-29 11:26:42,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +47: [2023-04-29 11:26:42,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 11:26:42,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +43: [2023-04-29 11:26:42,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +43: [2023-04-29 11:26:42,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +46: [2023-04-29 11:26:42,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 11:26:42,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +54: [2023-04-29 11:26:42,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +35: [2023-04-29 11:26:42,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +35: [2023-04-29 11:26:42,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +31: [2023-04-29 11:26:42,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +46: [2023-04-29 11:26:42,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +31: [2023-04-29 11:26:42,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +31: [2023-04-29 11:26:42,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +18: [2023-04-29 11:26:42,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +18: [2023-04-29 11:26:42,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +18: [2023-04-29 11:26:42,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +20: [2023-04-29 11:26:42,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +18: [2023-04-29 11:26:42,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +52: [2023-04-29 11:26:42,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +52: [2023-04-29 11:26:42,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +50: [2023-04-29 11:26:42,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 11:26:42,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +47: [2023-04-29 11:26:42,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +50: [2023-04-29 11:26:42,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +38: [2023-04-29 11:26:42,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +38: [2023-04-29 11:26:42,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +52: [2023-04-29 11:26:42,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 8: [2023-04-29 11:26:42,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +20: [2023-04-29 11:26:42,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +52: [2023-04-29 11:26:42,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +28: [2023-04-29 11:26:42,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +28: [2023-04-29 11:26:42,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +38: [2023-04-29 11:26:42,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +38: [2023-04-29 11:26:42,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +52: [2023-04-29 11:26:42,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +59: [2023-04-29 11:26:42,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +47: [2023-04-29 11:26:42,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +59: [2023-04-29 11:26:42,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +50: [2023-04-29 11:26:42,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 11:26:42,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +52: [2023-04-29 11:26:42,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +34: [2023-04-29 11:26:42,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +34: [2023-04-29 11:26:42,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 8: [2023-04-29 11:26:42,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 8: [2023-04-29 11:26:42,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +46: [2023-04-29 11:26:42,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +46: [2023-04-29 11:26:42,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +52: [2023-04-29 11:26:42,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +52: [2023-04-29 11:26:42,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +59: [2023-04-29 11:26:42,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +50: [2023-04-29 11:26:42,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 11:26:42,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +57: [2023-04-29 11:26:42,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +57: [2023-04-29 11:26:42,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +57: [2023-04-29 11:26:42,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +54: [2023-04-29 11:26:42,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 8: [2023-04-29 11:26:42,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +57: [2023-04-29 11:26:42,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +20: [2023-04-29 11:26:42,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +28: [2023-04-29 11:26:42,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +20: [2023-04-29 11:26:42,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +52: [2023-04-29 11:26:42,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 8: [2023-04-29 11:26:42,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +59: [2023-04-29 11:26:42,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 8: [2023-04-29 11:26:42,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +48: [2023-04-29 11:26:42,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +48: [2023-04-29 11:26:42,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +48: [2023-04-29 11:26:42,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +50: [2023-04-29 11:26:42,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +50: [2023-04-29 11:26:42,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +48: [2023-04-29 11:26:42,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +46: [2023-04-29 11:26:42,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +46: [2023-04-29 11:26:42,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +58: [2023-04-29 11:26:42,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +58: [2023-04-29 11:26:42,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +24: [2023-04-29 11:26:42,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +24: [2023-04-29 11:26:42,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +34: [2023-04-29 11:26:42,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +34: [2023-04-29 11:26:42,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +61: [2023-04-29 11:26:42,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +24: [2023-04-29 11:26:42,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +61: [2023-04-29 11:26:42,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +57: [2023-04-29 11:26:42,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +57: [2023-04-29 11:26:42,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +58: [2023-04-29 11:26:42,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +58: [2023-04-29 11:26:42,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +10: [2023-04-29 11:26:42,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +10: [2023-04-29 11:26:42,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +34: [2023-04-29 11:26:42,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +34: [2023-04-29 11:26:42,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +10: [2023-04-29 11:26:42,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +57: [2023-04-29 11:26:42,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +10: [2023-04-29 11:26:42,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +39: [2023-04-29 11:26:42,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +39: [2023-04-29 11:26:42,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +39: [2023-04-29 11:26:42,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +39: [2023-04-29 11:26:42,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. + 0: [2023-04-29 11:26:42,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +57: [2023-04-29 11:26:42,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +28: [2023-04-29 11:26:42,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +61: [2023-04-29 11:26:42,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +50: [2023-04-29 11:26:42,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +50: [2023-04-29 11:26:42,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +24: [2023-04-29 11:26:42,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +24: [2023-04-29 11:26:42,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +24: [2023-04-29 11:26:42,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 7: [2023-04-29 11:26:42,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +61: [2023-04-29 11:26:42,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +47: [2023-04-29 11:26:42,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +47: [2023-04-29 11:26:42,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 11:26:42,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +58: [2023-04-29 11:26:42,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +58: [2023-04-29 11:26:42,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +58: [2023-04-29 11:26:42,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +41: [2023-04-29 11:26:42,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +58: [2023-04-29 11:26:42,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +37: [2023-04-29 11:26:42,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +37: [2023-04-29 11:26:42,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. + 0: [2023-04-29 11:26:42,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +34: [2023-04-29 11:26:42,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +34: [2023-04-29 11:26:42,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +47: [2023-04-29 11:26:42,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +49: [2023-04-29 11:26:42,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +18: [2023-04-29 11:26:42,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +18: [2023-04-29 11:26:42,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +37: [2023-04-29 11:26:42,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +19: [2023-04-29 11:26:42,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +19: [2023-04-29 11:26:42,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +54: [2023-04-29 11:26:42,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +37: [2023-04-29 11:26:42,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +28: [2023-04-29 11:26:42,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +19: [2023-04-29 11:26:42,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +18: [2023-04-29 11:26:42,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +18: [2023-04-29 11:26:42,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +28: [2023-04-29 11:26:42,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +38: [2023-04-29 11:26:42,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +38: [2023-04-29 11:26:42,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +52: [2023-04-29 11:26:42,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +41: [2023-04-29 11:26:42,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +58: [2023-04-29 11:26:42,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +58: [2023-04-29 11:26:42,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +54: [2023-04-29 11:26:42,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +19: [2023-04-29 11:26:42,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +58: [2023-04-29 11:26:42,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +58: [2023-04-29 11:26:42,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 11:26:42,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +41: [2023-04-29 11:26:42,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +62: [2023-04-29 11:26:42,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +46: [2023-04-29 11:26:42,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 0: [2023-04-29 11:26:42,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +38: [2023-04-29 11:26:42,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +38: [2023-04-29 11:26:42,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +41: [2023-04-29 11:26:42,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +52: [2023-04-29 11:26:42,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 11:26:42,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +56: [2023-04-29 11:26:42,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +56: [2023-04-29 11:26:42,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +52: [2023-04-29 11:26:42,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +46: [2023-04-29 11:26:42,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +49: [2023-04-29 11:26:42,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +28: [2023-04-29 11:26:42,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +52: [2023-04-29 11:26:42,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 7: [2023-04-29 11:26:42,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +48: [2023-04-29 11:26:42,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +48: [2023-04-29 11:26:42,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +46: [2023-04-29 11:26:42,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 7: [2023-04-29 11:26:42,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +48: [2023-04-29 11:26:42,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 0: [2023-04-29 11:26:42,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +49: [2023-04-29 11:26:42,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +56: [2023-04-29 11:26:42,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +10: [2023-04-29 11:26:42,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +44: [2023-04-29 11:26:42,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +56: [2023-04-29 11:26:42,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +46: [2023-04-29 11:26:42,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +48: [2023-04-29 11:26:42,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +40: [2023-04-29 11:26:42,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +40: [2023-04-29 11:26:42,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +40: [2023-04-29 11:26:42,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +40: [2023-04-29 11:26:42,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 0: [2023-04-29 11:26:42,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 0: [2023-04-29 11:26:42,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +62: [2023-04-29 11:26:42,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +62: [2023-04-29 11:26:42,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +62: [2023-04-29 11:26:42,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +55: [2023-04-29 11:26:42,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +55: [2023-04-29 11:26:42,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. + 7: [2023-04-29 11:26:42,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +42: [2023-04-29 11:26:42,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 11:26:42,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +36: [2023-04-29 11:26:42,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +36: [2023-04-29 11:26:42,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +10: [2023-04-29 11:26:42,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +36: [2023-04-29 11:26:42,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +10: [2023-04-29 11:26:42,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +39: [2023-04-29 11:26:42,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +39: [2023-04-29 11:26:42,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +40: [2023-04-29 11:26:42,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +40: [2023-04-29 11:26:42,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +41: [2023-04-29 11:26:42,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +55: [2023-04-29 11:26:42,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +60: [2023-04-29 11:26:42,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +55: [2023-04-29 11:26:42,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +60: [2023-04-29 11:26:42,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +40: [2023-04-29 11:26:42,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +10: [2023-04-29 11:26:42,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +48: [2023-04-29 11:26:42,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +48: [2023-04-29 11:26:42,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +48: [2023-04-29 11:26:42,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +48: [2023-04-29 11:26:42,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +39: [2023-04-29 11:26:42,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +39: [2023-04-29 11:26:42,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +40: [2023-04-29 11:26:42,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +57: [2023-04-29 11:26:42,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +57: [2023-04-29 11:26:42,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +57: [2023-04-29 11:26:42,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +57: [2023-04-29 11:26:42,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +49: [2023-04-29 11:26:42,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +15: [2023-04-29 11:26:42,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +42: [2023-04-29 11:26:42,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 7: [2023-04-29 11:26:42,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +49: [2023-04-29 11:26:42,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +36: [2023-04-29 11:26:42,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +36: [2023-04-29 11:26:42,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +56: [2023-04-29 11:26:42,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +56: [2023-04-29 11:26:42,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +42: [2023-04-29 11:26:42,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +60: [2023-04-29 11:26:42,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +36: [2023-04-29 11:26:42,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +44: [2023-04-29 11:26:42,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 11:26:42,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +56: [2023-04-29 11:26:42,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +37: [2023-04-29 11:26:42,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 11:26:42,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +42: [2023-04-29 11:26:42,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +37: [2023-04-29 11:26:42,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +48: [2023-04-29 11:26:42,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +48: [2023-04-29 11:26:42,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +37: [2023-04-29 11:26:42,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +48: [2023-04-29 11:26:42,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +62: [2023-04-29 11:26:42,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +15: [2023-04-29 11:26:42,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +59: [2023-04-29 11:26:42,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +37: [2023-04-29 11:26:42,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +56: [2023-04-29 11:26:42,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +41: [2023-04-29 11:26:42,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +48: [2023-04-29 11:26:42,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +41: [2023-04-29 11:26:42,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +59: [2023-04-29 11:26:42,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +59: [2023-04-29 11:26:42,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +59: [2023-04-29 11:26:42,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 11:26:42,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +15: [2023-04-29 11:26:42,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +15: [2023-04-29 11:26:42,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +15: [2023-04-29 11:26:42,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +44: [2023-04-29 11:26:42,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +25: [2023-04-29 11:26:42,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +25: [2023-04-29 11:26:42,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +25: [2023-04-29 11:26:42,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +25: [2023-04-29 11:26:42,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +41: [2023-04-29 11:26:42,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +45: [2023-04-29 11:26:42,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +45: [2023-04-29 11:26:42,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +45: [2023-04-29 11:26:42,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +56: [2023-04-29 11:26:42,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +45: [2023-04-29 11:26:42,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +20: [2023-04-29 11:26:42,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +56: [2023-04-29 11:26:42,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +44: [2023-04-29 11:26:42,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +56: [2023-04-29 11:26:42,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +35: [2023-04-29 11:26:42,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +35: [2023-04-29 11:26:42,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +15: [2023-04-29 11:26:42,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +15: [2023-04-29 11:26:42,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +35: [2023-04-29 11:26:42,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +35: [2023-04-29 11:26:42,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +35: [2023-04-29 11:26:42,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +35: [2023-04-29 11:26:42,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +15: [2023-04-29 11:26:42,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +45: [2023-04-29 11:26:42,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +45: [2023-04-29 11:26:42,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +20: [2023-04-29 11:26:42,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +59: [2023-04-29 11:26:42,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +32: [2023-04-29 11:26:42,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 11:26:42,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 11:26:42,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +23: [2023-04-29 11:26:42,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +23: [2023-04-29 11:26:42,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +20: [2023-04-29 11:26:42,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +23: [2023-04-29 11:26:42,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +32: [2023-04-29 11:26:42,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +23: [2023-04-29 11:26:42,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +42: [2023-04-29 11:26:42,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +20: [2023-04-29 11:26:42,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +62: [2023-04-29 11:26:42,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +45: [2023-04-29 11:26:42,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +35: [2023-04-29 11:26:42,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +35: [2023-04-29 11:26:42,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +62: [2023-04-29 11:26:42,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +62: [2023-04-29 11:26:42,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +45: [2023-04-29 11:26:42,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +46: [2023-04-29 11:26:42,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +20: [2023-04-29 11:26:42,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +40: [2023-04-29 11:26:42,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +40: [2023-04-29 11:26:42,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +40: [2023-04-29 11:26:42,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +40: [2023-04-29 11:26:42,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +59: [2023-04-29 11:26:42,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +59: [2023-04-29 11:26:42,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +20: [2023-04-29 11:26:42,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +46: [2023-04-29 11:26:42,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +35: [2023-04-29 11:26:42,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +32: [2023-04-29 11:26:42,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +55: [2023-04-29 11:26:42,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +56: [2023-04-29 11:26:42,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +35: [2023-04-29 11:26:42,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +32: [2023-04-29 11:26:42,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +32: [2023-04-29 11:26:42,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +55: [2023-04-29 11:26:42,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +55: [2023-04-29 11:26:42,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +32: [2023-04-29 11:26:42,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +59: [2023-04-29 11:26:42,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +50: [2023-04-29 11:26:42,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +35: [2023-04-29 11:26:42,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +57: [2023-04-29 11:26:42,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +35: [2023-04-29 11:26:42,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +35: [2023-04-29 11:26:42,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +59: [2023-04-29 11:26:42,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +35: [2023-04-29 11:26:42,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +35: [2023-04-29 11:26:42,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +57: [2023-04-29 11:26:42,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +59: [2023-04-29 11:26:42,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +35: [2023-04-29 11:26:42,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +44: [2023-04-29 11:26:42,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +50: [2023-04-29 11:26:42,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +57: [2023-04-29 11:26:42,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +57: [2023-04-29 11:26:42,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +49: [2023-04-29 11:26:42,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +49: [2023-04-29 11:26:42,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +55: [2023-04-29 11:26:42,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +60: [2023-04-29 11:26:42,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +20: [2023-04-29 11:26:42,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +42: [2023-04-29 11:26:42,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +42: [2023-04-29 11:26:42,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +42: [2023-04-29 11:26:42,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +50: [2023-04-29 11:26:42,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +42: [2023-04-29 11:26:42,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +50: [2023-04-29 11:26:42,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +60: [2023-04-29 11:26:42,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +46: [2023-04-29 11:26:42,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +18: [2023-04-29 11:26:43,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +42: [2023-04-29 11:26:43,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +44: [2023-04-29 11:26:43,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +44: [2023-04-29 11:26:43,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +50: [2023-04-29 11:26:43,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +42: [2023-04-29 11:26:43,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +42: [2023-04-29 11:26:43,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +58: [2023-04-29 11:26:43,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +58: [2023-04-29 11:26:43,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +60: [2023-04-29 11:26:43,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +47: [2023-04-29 11:26:43,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +25: [2023-04-29 11:26:43,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +20: [2023-04-29 11:26:43,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +50: [2023-04-29 11:26:43,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +18: [2023-04-29 11:26:43,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +25: [2023-04-29 11:26:43,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +25: [2023-04-29 11:26:43,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +43: [2023-04-29 11:26:43,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 11:26:43,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 11:26:43,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 11:26:43,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +57: [2023-04-29 11:26:43,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +59: [2023-04-29 11:26:43,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +25: [2023-04-29 11:26:43,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +46: [2023-04-29 11:26:43,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +56: [2023-04-29 11:26:43,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +56: [2023-04-29 11:26:43,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +58: [2023-04-29 11:26:43,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +57: [2023-04-29 11:26:43,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +57: [2023-04-29 11:26:43,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +38: [2023-04-29 11:26:43,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +59: [2023-04-29 11:26:43,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 11:26:43,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +56: [2023-04-29 11:26:43,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +56: [2023-04-29 11:26:43,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +22: [2023-04-29 11:26:43,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +22: [2023-04-29 11:26:43,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +19: [2023-04-29 11:26:43,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +19: [2023-04-29 11:26:43,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +58: [2023-04-29 11:26:43,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +58: [2023-04-29 11:26:43,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +18: [2023-04-29 11:26:43,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +50: [2023-04-29 11:26:43,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +58: [2023-04-29 11:26:43,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +57: [2023-04-29 11:26:43,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +22: [2023-04-29 11:26:43,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +50: [2023-04-29 11:26:43,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +45: [2023-04-29 11:26:43,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +45: [2023-04-29 11:26:43,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +45: [2023-04-29 11:26:43,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +22: [2023-04-29 11:26:43,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +49: [2023-04-29 11:26:43,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +59: [2023-04-29 11:26:43,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +59: [2023-04-29 11:26:43,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +45: [2023-04-29 11:26:43,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +43: [2023-04-29 11:26:43,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +43: [2023-04-29 11:26:43,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +43: [2023-04-29 11:26:43,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +43: [2023-04-29 11:26:43,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +46: [2023-04-29 11:26:43,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 11:26:43,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +38: [2023-04-29 11:26:43,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +19: [2023-04-29 11:26:43,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +18: [2023-04-29 11:26:43,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +18: [2023-04-29 11:26:43,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +19: [2023-04-29 11:26:43,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +58: [2023-04-29 11:26:43,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +46: [2023-04-29 11:26:43,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +18: [2023-04-29 11:26:43,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +19: [2023-04-29 11:26:43,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +19: [2023-04-29 11:26:43,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +58: [2023-04-29 11:26:43,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +38: [2023-04-29 11:26:43,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +47: [2023-04-29 11:26:43,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +47: [2023-04-29 11:26:43,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +47: [2023-04-29 11:26:43,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +38: [2023-04-29 11:26:43,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +47: [2023-04-29 11:26:43,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +38: [2023-04-29 11:26:43,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +12: [2023-04-29 11:26:43,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +12: [2023-04-29 11:26:43,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +12: [2023-04-29 11:26:43,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +12: [2023-04-29 11:26:43,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +48: [2023-04-29 11:26:43,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +40: [2023-04-29 11:26:43,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +59: [2023-04-29 11:26:43,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +40: [2023-04-29 11:26:43,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +58: [2023-04-29 11:26:43,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +46: [2023-04-29 11:26:43,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +38: [2023-04-29 11:26:43,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +40: [2023-04-29 11:26:43,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +19: [2023-04-29 11:26:43,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +19: [2023-04-29 11:26:43,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +18: [2023-04-29 11:26:43,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +18: [2023-04-29 11:26:43,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +40: [2023-04-29 11:26:43,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +58: [2023-04-29 11:26:43,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +58: [2023-04-29 11:26:43,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +48: [2023-04-29 11:26:43,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +47: [2023-04-29 11:26:43,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +36: [2023-04-29 11:26:43,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +36: [2023-04-29 11:26:43,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +23: [2023-04-29 11:26:43,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +10: [2023-04-29 11:26:43,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +59: [2023-04-29 11:26:43,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +38: [2023-04-29 11:26:43,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +46: [2023-04-29 11:26:43,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +38: [2023-04-29 11:26:43,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +36: [2023-04-29 11:26:43,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +23: [2023-04-29 11:26:43,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +39: [2023-04-29 11:26:43,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +39: [2023-04-29 11:26:43,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +23: [2023-04-29 11:26:43,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +36: [2023-04-29 11:26:43,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +32: [2023-04-29 11:26:43,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +32: [2023-04-29 11:26:43,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +42: [2023-04-29 11:26:43,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +36: [2023-04-29 11:26:43,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +23: [2023-04-29 11:26:43,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +48: [2023-04-29 11:26:43,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +58: [2023-04-29 11:26:43,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +46: [2023-04-29 11:26:43,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +10: [2023-04-29 11:26:43,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +10: [2023-04-29 11:26:43,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +32: [2023-04-29 11:26:43,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. + 4: [2023-04-29 11:26:43,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 4: [2023-04-29 11:26:43,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 4: [2023-04-29 11:26:43,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +42: [2023-04-29 11:26:43,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +42: [2023-04-29 11:26:43,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 4: [2023-04-29 11:26:43,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +40: [2023-04-29 11:26:43,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +39: [2023-04-29 11:26:43,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +39: [2023-04-29 11:26:43,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +32: [2023-04-29 11:26:43,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +37: [2023-04-29 11:26:43,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +46: [2023-04-29 11:26:43,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +57: [2023-04-29 11:26:43,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +57: [2023-04-29 11:26:43,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +42: [2023-04-29 11:26:43,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +57: [2023-04-29 11:26:43,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +48: [2023-04-29 11:26:43,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +48: [2023-04-29 11:26:43,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +48: [2023-04-29 11:26:43,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +10: [2023-04-29 11:26:43,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +10: [2023-04-29 11:26:43,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +39: [2023-04-29 11:26:43,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 11:26:43,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +39: [2023-04-29 11:26:43,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +40: [2023-04-29 11:26:43,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +22: [2023-04-29 11:26:43,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +45: [2023-04-29 11:26:43,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +57: [2023-04-29 11:26:43,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +22: [2023-04-29 11:26:43,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +10: [2023-04-29 11:26:43,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +37: [2023-04-29 11:26:43,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +45: [2023-04-29 11:26:43,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +46: [2023-04-29 11:26:43,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +46: [2023-04-29 11:26:43,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +22: [2023-04-29 11:26:43,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +63: [2023-04-29 11:26:43,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 11:26:43,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 11:26:43,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 11:26:43,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +48: [2023-04-29 11:26:43,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +48: [2023-04-29 11:26:43,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +48: [2023-04-29 11:26:43,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +10: [2023-04-29 11:26:43,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +39: [2023-04-29 11:26:43,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +46: [2023-04-29 11:26:43,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +39: [2023-04-29 11:26:43,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +22: [2023-04-29 11:26:43,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +48: [2023-04-29 11:26:43,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +37: [2023-04-29 11:26:43,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +37: [2023-04-29 11:26:43,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +12: [2023-04-29 11:26:43,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +10: [2023-04-29 11:26:43,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +40: [2023-04-29 11:26:43,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +45: [2023-04-29 11:26:43,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +45: [2023-04-29 11:26:43,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +46: [2023-04-29 11:26:43,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +58: [2023-04-29 11:26:43,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +48: [2023-04-29 11:26:43,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +63: [2023-04-29 11:26:43,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +37: [2023-04-29 11:26:43,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +12: [2023-04-29 11:26:43,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +63: [2023-04-29 11:26:43,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +61: [2023-04-29 11:26:43,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +61: [2023-04-29 11:26:43,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +46: [2023-04-29 11:26:43,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +63: [2023-04-29 11:26:43,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +40: [2023-04-29 11:26:43,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +63: [2023-04-29 11:26:43,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +58: [2023-04-29 11:26:43,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +12: [2023-04-29 11:26:43,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +12: [2023-04-29 11:26:43,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +32: [2023-04-29 11:26:43,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +46: [2023-04-29 11:26:43,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +58: [2023-04-29 11:26:43,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +61: [2023-04-29 11:26:43,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +36: [2023-04-29 11:26:43,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +36: [2023-04-29 11:26:43,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +36: [2023-04-29 11:26:43,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +61: [2023-04-29 11:26:43,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +37: [2023-04-29 11:26:43,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +48: [2023-04-29 11:26:43,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +37: [2023-04-29 11:26:43,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +35: [2023-04-29 11:26:43,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 11:26:43,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +55: [2023-04-29 11:26:43,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 11:26:43,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +37: [2023-04-29 11:26:43,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +45: [2023-04-29 11:26:43,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +58: [2023-04-29 11:26:43,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +40: [2023-04-29 11:26:43,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +36: [2023-04-29 11:26:43,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +32: [2023-04-29 11:26:43,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +45: [2023-04-29 11:26:43,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 4: [2023-04-29 11:26:43,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 4: [2023-04-29 11:26:43,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +32: [2023-04-29 11:26:43,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +55: [2023-04-29 11:26:43,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... + 4: [2023-04-29 11:26:43,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 2: [2023-04-29 11:26:43,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 2: [2023-04-29 11:26:43,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 2: [2023-04-29 11:26:43,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 2: [2023-04-29 11:26:43,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 4: [2023-04-29 11:26:43,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +36: [2023-04-29 11:26:43,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +36: [2023-04-29 11:26:43,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +30: [2023-04-29 11:26:43,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +30: [2023-04-29 11:26:43,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +30: [2023-04-29 11:26:43,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +30: [2023-04-29 11:26:43,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +35: [2023-04-29 11:26:43,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +35: [2023-04-29 11:26:43,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +25: [2023-04-29 11:26:43,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +57: [2023-04-29 11:26:43,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +19: [2023-04-29 11:26:43,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +19: [2023-04-29 11:26:43,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +19: [2023-04-29 11:26:43,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +40: [2023-04-29 11:26:43,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +35: [2023-04-29 11:26:43,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +19: [2023-04-29 11:26:43,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +63: [2023-04-29 11:26:43,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +63: [2023-04-29 11:26:43,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +57: [2023-04-29 11:26:43,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +57: [2023-04-29 11:26:43,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +55: [2023-04-29 11:26:43,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +30: [2023-04-29 11:26:43,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +30: [2023-04-29 11:26:43,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +30: [2023-04-29 11:26:43,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +32: [2023-04-29 11:26:43,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +30: [2023-04-29 11:26:43,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 11:26:43,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +55: [2023-04-29 11:26:43,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +48: [2023-04-29 11:26:43,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +43: [2023-04-29 11:26:43,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +34: [2023-04-29 11:26:43,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +34: [2023-04-29 11:26:43,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +25: [2023-04-29 11:26:43,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +26: [2023-04-29 11:26:43,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +26: [2023-04-29 11:26:43,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +26: [2023-04-29 11:26:43,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +26: [2023-04-29 11:26:43,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +57: [2023-04-29 11:26:43,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +40: [2023-04-29 11:26:43,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +57: [2023-04-29 11:26:43,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +19: [2023-04-29 11:26:43,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +48: [2023-04-29 11:26:43,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +48: [2023-04-29 11:26:43,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +19: [2023-04-29 11:26:43,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +57: [2023-04-29 11:26:43,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +45: [2023-04-29 11:26:43,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +63: [2023-04-29 11:26:43,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +57: [2023-04-29 11:26:43,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +19: [2023-04-29 11:26:43,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +34: [2023-04-29 11:26:43,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +25: [2023-04-29 11:26:43,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +25: [2023-04-29 11:26:43,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +25: [2023-04-29 11:26:43,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +63: [2023-04-29 11:26:43,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +19: [2023-04-29 11:26:43,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +34: [2023-04-29 11:26:43,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +56: [2023-04-29 11:26:43,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +61: [2023-04-29 11:26:43,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +43: [2023-04-29 11:26:43,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 11:26:43,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +34: [2023-04-29 11:26:43,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +34: [2023-04-29 11:26:43,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +43: [2023-04-29 11:26:43,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +40: [2023-04-29 11:26:43,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +35: [2023-04-29 11:26:43,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +45: [2023-04-29 11:26:43,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +56: [2023-04-29 11:26:43,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +57: [2023-04-29 11:26:43,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +55: [2023-04-29 11:26:43,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +25: [2023-04-29 11:26:43,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +61: [2023-04-29 11:26:43,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +61: [2023-04-29 11:26:43,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +61: [2023-04-29 11:26:43,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +45: [2023-04-29 11:26:43,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +34: [2023-04-29 11:26:43,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +48: [2023-04-29 11:26:43,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +25: [2023-04-29 11:26:43,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +55: [2023-04-29 11:26:43,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +55: [2023-04-29 11:26:43,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +25: [2023-04-29 11:26:43,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +56: [2023-04-29 11:26:43,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +34: [2023-04-29 11:26:43,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +56: [2023-04-29 11:26:43,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +56: [2023-04-29 11:26:43,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +45: [2023-04-29 11:26:43,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +56: [2023-04-29 11:26:43,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +36: [2023-04-29 11:26:43,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +36: [2023-04-29 11:26:43,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +14: [2023-04-29 11:26:43,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +14: [2023-04-29 11:26:43,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +14: [2023-04-29 11:26:43,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 1: [2023-04-29 11:26:43,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 1: [2023-04-29 11:26:43,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 1: [2023-04-29 11:26:43,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 1: [2023-04-29 11:26:43,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +14: [2023-04-29 11:26:43,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +56: [2023-04-29 11:26:43,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +56: [2023-04-29 11:26:43,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +23: [2023-04-29 11:26:43,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 2: [2023-04-29 11:26:43,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 5: [2023-04-29 11:26:43,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 5: [2023-04-29 11:26:43,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 5: [2023-04-29 11:26:43,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +44: [2023-04-29 11:26:43,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +44: [2023-04-29 11:26:43,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. + 5: [2023-04-29 11:26:43,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 2: [2023-04-29 11:26:43,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 4: [2023-04-29 11:26:43,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 4: [2023-04-29 11:26:43,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 4: [2023-04-29 11:26:43,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +26: [2023-04-29 11:26:43,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 4: [2023-04-29 11:26:43,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +43: [2023-04-29 11:26:43,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +23: [2023-04-29 11:26:43,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +44: [2023-04-29 11:26:43,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +44: [2023-04-29 11:26:43,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +42: [2023-04-29 11:26:43,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +42: [2023-04-29 11:26:43,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +23: [2023-04-29 11:26:43,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +32: [2023-04-29 11:26:43,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 11:26:43,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 11:26:43,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 11:26:43,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +42: [2023-04-29 11:26:43,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +63: [2023-04-29 11:26:43,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +35: [2023-04-29 11:26:43,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +35: [2023-04-29 11:26:43,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 4: [2023-04-29 11:26:43,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +23: [2023-04-29 11:26:43,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 8: [2023-04-29 11:26:43,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 8: [2023-04-29 11:26:43,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 8: [2023-04-29 11:26:43,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +23: [2023-04-29 11:26:43,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +26: [2023-04-29 11:26:43,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 8: [2023-04-29 11:26:43,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +40: [2023-04-29 11:26:43,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 4: [2023-04-29 11:26:43,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +45: [2023-04-29 11:26:43,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 4: [2023-04-29 11:26:43,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +63: [2023-04-29 11:26:43,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +40: [2023-04-29 11:26:43,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +40: [2023-04-29 11:26:43,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +40: [2023-04-29 11:26:43,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +35: [2023-04-29 11:26:43,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +23: [2023-04-29 11:26:43,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 4: [2023-04-29 11:26:43,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +43: [2023-04-29 11:26:43,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +42: [2023-04-29 11:26:43,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +42: [2023-04-29 11:26:43,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +42: [2023-04-29 11:26:43,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +22: [2023-04-29 11:26:43,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +22: [2023-04-29 11:26:43,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +12: [2023-04-29 11:26:43,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +42: [2023-04-29 11:26:43,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 8: [2023-04-29 11:26:43,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 8: [2023-04-29 11:26:43,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +43: [2023-04-29 11:26:43,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +43: [2023-04-29 11:26:43,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +40: [2023-04-29 11:26:43,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... + 8: [2023-04-29 11:26:43,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 8: [2023-04-29 11:26:43,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 6: [2023-04-29 11:26:43,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 6: [2023-04-29 11:26:43,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 6: [2023-04-29 11:26:43,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +26: [2023-04-29 11:26:43,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +26: [2023-04-29 11:26:43,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 6: [2023-04-29 11:26:43,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +23: [2023-04-29 11:26:43,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +45: [2023-04-29 11:26:43,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +23: [2023-04-29 11:26:43,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +12: [2023-04-29 11:26:43,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +22: [2023-04-29 11:26:43,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +22: [2023-04-29 11:26:43,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +22: [2023-04-29 11:26:43,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +40: [2023-04-29 11:26:43,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +40: [2023-04-29 11:26:43,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +40: [2023-04-29 11:26:43,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +42: [2023-04-29 11:26:43,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +21: [2023-04-29 11:26:43,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +21: [2023-04-29 11:26:43,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +14: [2023-04-29 11:26:43,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +14: [2023-04-29 11:26:43,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 1: [2023-04-29 11:26:43,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 1: [2023-04-29 11:26:43,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +14: [2023-04-29 11:26:43,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +32: [2023-04-29 11:26:43,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 11:26:43,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 11:26:43,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +63: [2023-04-29 11:26:43,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 1: [2023-04-29 11:26:43,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +21: [2023-04-29 11:26:43,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 1: [2023-04-29 11:26:43,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +21: [2023-04-29 11:26:43,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +12: [2023-04-29 11:26:43,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +12: [2023-04-29 11:26:43,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +45: [2023-04-29 11:26:43,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +28: [2023-04-29 11:26:43,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +28: [2023-04-29 11:26:43,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +12: [2023-04-29 11:26:43,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +22: [2023-04-29 11:26:43,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +63: [2023-04-29 11:26:43,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +28: [2023-04-29 11:26:43,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +45: [2023-04-29 11:26:43,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +22: [2023-04-29 11:26:43,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +28: [2023-04-29 11:26:43,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +32: [2023-04-29 11:26:43,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... + 5: [2023-04-29 11:26:43,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +63: [2023-04-29 11:26:43,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 5: [2023-04-29 11:26:43,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +36: [2023-04-29 11:26:43,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +36: [2023-04-29 11:26:43,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +45: [2023-04-29 11:26:43,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +14: [2023-04-29 11:26:43,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +12: [2023-04-29 11:26:43,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +12: [2023-04-29 11:26:43,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +44: [2023-04-29 11:26:43,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +12: [2023-04-29 11:26:43,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +44: [2023-04-29 11:26:43,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +44: [2023-04-29 11:26:43,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +44: [2023-04-29 11:26:43,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... + 5: [2023-04-29 11:26:43,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +36: [2023-04-29 11:26:43,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +22: [2023-04-29 11:26:43,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +30: [2023-04-29 11:26:43,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +30: [2023-04-29 11:26:43,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 4: [2023-04-29 11:26:43,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 4: [2023-04-29 11:26:43,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 11:26:43,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +17: [2023-04-29 11:26:43,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +17: [2023-04-29 11:26:43,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +36: [2023-04-29 11:26:43,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +36: [2023-04-29 11:26:43,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +17: [2023-04-29 11:26:43,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +17: [2023-04-29 11:26:43,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +30: [2023-04-29 11:26:43,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +36: [2023-04-29 11:26:43,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +36: [2023-04-29 11:26:43,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +30: [2023-04-29 11:26:43,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +61: [2023-04-29 11:26:43,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 11:26:43,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 4: [2023-04-29 11:26:43,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 4: [2023-04-29 11:26:43,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 6: [2023-04-29 11:26:43,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 4: [2023-04-29 11:26:43,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 4: [2023-04-29 11:26:43,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +45: [2023-04-29 11:26:43,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +61: [2023-04-29 11:26:43,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... + 6: [2023-04-29 11:26:43,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +32: [2023-04-29 11:26:43,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 6: [2023-04-29 11:26:43,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +16: [2023-04-29 11:26:43,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +32: [2023-04-29 11:26:43,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +16: [2023-04-29 11:26:43,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +63: [2023-04-29 11:26:43,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 11:26:43,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +16: [2023-04-29 11:26:43,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 11:26:43,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +32: [2023-04-29 11:26:43,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +32: [2023-04-29 11:26:43,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +36: [2023-04-29 11:26:43,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +30: [2023-04-29 11:26:43,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +33: [2023-04-29 11:26:43,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +33: [2023-04-29 11:26:43,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +33: [2023-04-29 11:26:43,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +33: [2023-04-29 11:26:43,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 11:26:43,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +19: [2023-04-29 11:26:43,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 11:26:43,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +16: [2023-04-29 11:26:43,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +16: [2023-04-29 11:26:43,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +62: [2023-04-29 11:26:43,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +62: [2023-04-29 11:26:43,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +63: [2023-04-29 11:26:43,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +62: [2023-04-29 11:26:43,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +16: [2023-04-29 11:26:43,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +21: [2023-04-29 11:26:43,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +16: [2023-04-29 11:26:43,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +34: [2023-04-29 11:26:43,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 4: [2023-04-29 11:26:43,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +53: [2023-04-29 11:26:43,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +53: [2023-04-29 11:26:43,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +53: [2023-04-29 11:26:43,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. + 4: [2023-04-29 11:26:43,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +62: [2023-04-29 11:26:43,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +45: [2023-04-29 11:26:43,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +53: [2023-04-29 11:26:43,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +33: [2023-04-29 11:26:43,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +61: [2023-04-29 11:26:43,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +19: [2023-04-29 11:26:43,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +19: [2023-04-29 11:26:43,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 11:26:43,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +33: [2023-04-29 11:26:43,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +16: [2023-04-29 11:26:43,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +33: [2023-04-29 11:26:43,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +27: [2023-04-29 11:26:43,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +27: [2023-04-29 11:26:43,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +30: [2023-04-29 11:26:43,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +30: [2023-04-29 11:26:43,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +30: [2023-04-29 11:26:43,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 11:26:43,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +21: [2023-04-29 11:26:43,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +21: [2023-04-29 11:26:43,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +28: [2023-04-29 11:26:43,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +28: [2023-04-29 11:26:43,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +27: [2023-04-29 11:26:43,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +27: [2023-04-29 11:26:43,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 3: [2023-04-29 11:26:43,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 3: [2023-04-29 11:26:43,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +34: [2023-04-29 11:26:43,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +33: [2023-04-29 11:26:43,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +19: [2023-04-29 11:26:43,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +27: [2023-04-29 11:26:43,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +61: [2023-04-29 11:26:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +61: [2023-04-29 11:26:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +27: [2023-04-29 11:26:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +27: [2023-04-29 11:26:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 3: [2023-04-29 11:26:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +61: [2023-04-29 11:26:43,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +27: [2023-04-29 11:26:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 3: [2023-04-29 11:26:43,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +28: [2023-04-29 11:26:43,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +28: [2023-04-29 11:26:43,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +21: [2023-04-29 11:26:43,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +27: [2023-04-29 11:26:43,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +27: [2023-04-29 11:26:43,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +34: [2023-04-29 11:26:43,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 3: [2023-04-29 11:26:43,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +32: [2023-04-29 11:26:43,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +27: [2023-04-29 11:26:43,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +34: [2023-04-29 11:26:43,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 3: [2023-04-29 11:26:43,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +17: [2023-04-29 11:26:43,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +61: [2023-04-29 11:26:43,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +29: [2023-04-29 11:26:43,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +29: [2023-04-29 11:26:43,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 3: [2023-04-29 11:26:43,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +61: [2023-04-29 11:26:43,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +29: [2023-04-29 11:26:43,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +27: [2023-04-29 11:26:43,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +49: [2023-04-29 11:26:43,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +49: [2023-04-29 11:26:43,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +29: [2023-04-29 11:26:43,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +63: [2023-04-29 11:26:43,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +26: [2023-04-29 11:26:43,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +49: [2023-04-29 11:26:43,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. +49: [2023-04-29 11:26:43,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_27-model_01-model_states.pt. + 3: [2023-04-29 11:26:43,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +32: [2023-04-29 11:26:43,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +13: [2023-04-29 11:26:43,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 11:26:43,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +22: [2023-04-29 11:26:43,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +22: [2023-04-29 11:26:43,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +30: [2023-04-29 11:26:43,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +13: [2023-04-29 11:26:43,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 3: [2023-04-29 11:26:43,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 3: [2023-04-29 11:26:43,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +22: [2023-04-29 11:26:43,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +22: [2023-04-29 11:26:43,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 11:26:43,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +13: [2023-04-29 11:26:43,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +26: [2023-04-29 11:26:43,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 4: [2023-04-29 11:26:43,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 11:26:43,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +17: [2023-04-29 11:26:43,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 0: [2023-04-29 11:26:43,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 0: [2023-04-29 11:26:43,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 0: [2023-04-29 11:26:43,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +30: [2023-04-29 11:26:43,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +32: [2023-04-29 11:26:43,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +30: [2023-04-29 11:26:43,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +13: [2023-04-29 11:26:43,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +13: [2023-04-29 11:26:43,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 3: [2023-04-29 11:26:43,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 0: [2023-04-29 11:26:43,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 3: [2023-04-29 11:26:43,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +13: [2023-04-29 11:26:43,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +13: [2023-04-29 11:26:43,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +13: [2023-04-29 11:26:43,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +22: [2023-04-29 11:26:43,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 2: [2023-04-29 11:26:43,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +22: [2023-04-29 11:26:43,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +22: [2023-04-29 11:26:43,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 2: [2023-04-29 11:26:43,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +26: [2023-04-29 11:26:43,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +26: [2023-04-29 11:26:43,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +30: [2023-04-29 11:26:43,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 0: [2023-04-29 11:26:43,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +32: [2023-04-29 11:26:43,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +13: [2023-04-29 11:26:43,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 0: [2023-04-29 11:26:43,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +13: [2023-04-29 11:26:43,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. + 2: [2023-04-29 11:26:43,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +34: [2023-04-29 11:26:43,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +13: [2023-04-29 11:26:43,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +26: [2023-04-29 11:26:43,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 5: [2023-04-29 11:26:43,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +32: [2023-04-29 11:26:43,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +22: [2023-04-29 11:26:43,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 5: [2023-04-29 11:26:43,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 8: [2023-04-29 11:26:43,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +26: [2023-04-29 11:26:43,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 0: [2023-04-29 11:26:43,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 5: [2023-04-29 11:26:43,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 0: [2023-04-29 11:26:43,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 5: [2023-04-29 11:26:43,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +53: [2023-04-29 11:26:43,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +53: [2023-04-29 11:26:43,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 9: [2023-04-29 11:26:43,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 4: [2023-04-29 11:26:43,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +63: [2023-04-29 11:26:43,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 2: [2023-04-29 11:26:43,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 2: [2023-04-29 11:26:43,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +62: [2023-04-29 11:26:43,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +62: [2023-04-29 11:26:43,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 2: [2023-04-29 11:26:43,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +11: [2023-04-29 11:26:43,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 11:26:43,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 11:26:43,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +14: [2023-04-29 11:26:43,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +53: [2023-04-29 11:26:43,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 2: [2023-04-29 11:26:43,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +63: [2023-04-29 11:26:43,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +62: [2023-04-29 11:26:43,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +62: [2023-04-29 11:26:43,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +26: [2023-04-29 11:26:43,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +11: [2023-04-29 11:26:43,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +26: [2023-04-29 11:26:43,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +11: [2023-04-29 11:26:43,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +16: [2023-04-29 11:26:43,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +30: [2023-04-29 11:26:43,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 2: [2023-04-29 11:26:43,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 2: [2023-04-29 11:26:43,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +53: [2023-04-29 11:26:43,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 5: [2023-04-29 11:26:43,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +15: [2023-04-29 11:26:43,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +15: [2023-04-29 11:26:43,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 11:26:43,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +19: [2023-04-29 11:26:43,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 5: [2023-04-29 11:26:43,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +15: [2023-04-29 11:26:43,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +26: [2023-04-29 11:26:43,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +15: [2023-04-29 11:26:43,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 11:26:43,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +27: [2023-04-29 11:26:43,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +26: [2023-04-29 11:26:43,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +32: [2023-04-29 11:26:43,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +27: [2023-04-29 11:26:43,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +19: [2023-04-29 11:26:43,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +30: [2023-04-29 11:26:43,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +26: [2023-04-29 11:26:43,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 5: [2023-04-29 11:26:43,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +27: [2023-04-29 11:26:43,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 6: [2023-04-29 11:26:43,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +10: [2023-04-29 11:26:43,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 5: [2023-04-29 11:26:43,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 6: [2023-04-29 11:26:43,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +10: [2023-04-29 11:26:43,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +10: [2023-04-29 11:26:43,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +30: [2023-04-29 11:26:43,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +14: [2023-04-29 11:26:43,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +34: [2023-04-29 11:26:43,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +11: [2023-04-29 11:26:43,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +10: [2023-04-29 11:26:43,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +30: [2023-04-29 11:26:43,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +11: [2023-04-29 11:26:43,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_05-model_01-model_states.pt. +11: [2023-04-29 11:26:43,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +19: [2023-04-29 11:26:43,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 2: [2023-04-29 11:26:43,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +11: [2023-04-29 11:26:43,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 9: [2023-04-29 11:26:43,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +27: [2023-04-29 11:26:43,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +21: [2023-04-29 11:26:43,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +21: [2023-04-29 11:26:43,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 9: [2023-04-29 11:26:43,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +21: [2023-04-29 11:26:43,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +21: [2023-04-29 11:26:43,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +53: [2023-04-29 11:26:43,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 11:26:43,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 4: [2023-04-29 11:26:43,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 4: [2023-04-29 11:26:43,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 11:26:43,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +15: [2023-04-29 11:26:43,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +15: [2023-04-29 11:26:43,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +53: [2023-04-29 11:26:43,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +15: [2023-04-29 11:26:43,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +15: [2023-04-29 11:26:43,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +39: [2023-04-29 11:26:43,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +39: [2023-04-29 11:26:43,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +39: [2023-04-29 11:26:43,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 11:26:43,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 1: [2023-04-29 11:26:43,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 1: [2023-04-29 11:26:43,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +11: [2023-04-29 11:26:43,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +14: [2023-04-29 11:26:43,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +39: [2023-04-29 11:26:43,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +14: [2023-04-29 11:26:43,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 4: [2023-04-29 11:26:43,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +19: [2023-04-29 11:26:43,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 8: [2023-04-29 11:26:43,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 8: [2023-04-29 11:26:43,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 8: [2023-04-29 11:26:43,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 11:26:43,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +10: [2023-04-29 11:26:43,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +10: [2023-04-29 11:26:43,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +29: [2023-04-29 11:26:43,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 6: [2023-04-29 11:26:43,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +26: [2023-04-29 11:26:43,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +63: [2023-04-29 11:26:43,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 6: [2023-04-29 11:26:43,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 6: [2023-04-29 11:26:43,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +63: [2023-04-29 11:26:43,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 11:26:43,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +34: [2023-04-29 11:26:43,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +34: [2023-04-29 11:26:43,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +21: [2023-04-29 11:26:43,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +21: [2023-04-29 11:26:43,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +21: [2023-04-29 11:26:43,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +10: [2023-04-29 11:26:43,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +49: [2023-04-29 11:26:43,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +21: [2023-04-29 11:26:43,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +39: [2023-04-29 11:26:43,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +53: [2023-04-29 11:26:43,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +53: [2023-04-29 11:26:43,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +26: [2023-04-29 11:26:43,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +39: [2023-04-29 11:26:43,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +10: [2023-04-29 11:26:43,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +39: [2023-04-29 11:26:43,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +39: [2023-04-29 11:26:43,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 5: [2023-04-29 11:26:43,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +26: [2023-04-29 11:26:43,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 1: [2023-04-29 11:26:43,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 9: [2023-04-29 11:26:43,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +14: [2023-04-29 11:26:43,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +14: [2023-04-29 11:26:43,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 9: [2023-04-29 11:26:43,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +53: [2023-04-29 11:26:43,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 1: [2023-04-29 11:26:43,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +29: [2023-04-29 11:26:43,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 1: [2023-04-29 11:26:43,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +29: [2023-04-29 11:26:43,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +29: [2023-04-29 11:26:43,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +53: [2023-04-29 11:26:43,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +11: [2023-04-29 11:26:43,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +44: [2023-04-29 11:26:43,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 11:26:43,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +63: [2023-04-29 11:26:43,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +31: [2023-04-29 11:26:43,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +31: [2023-04-29 11:26:43,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +31: [2023-04-29 11:26:43,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +49: [2023-04-29 11:26:43,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +49: [2023-04-29 11:26:43,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +63: [2023-04-29 11:26:43,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +47: [2023-04-29 11:26:43,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +47: [2023-04-29 11:26:43,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +31: [2023-04-29 11:26:43,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 1: [2023-04-29 11:26:43,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 5: [2023-04-29 11:26:43,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 1: [2023-04-29 11:26:43,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +44: [2023-04-29 11:26:43,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +44: [2023-04-29 11:26:43,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +13: [2023-04-29 11:26:43,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +14: [2023-04-29 11:26:43,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +44: [2023-04-29 11:26:43,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +13: [2023-04-29 11:26:43,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +47: [2023-04-29 11:26:43,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +26: [2023-04-29 11:26:43,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 3: [2023-04-29 11:26:43,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +47: [2023-04-29 11:26:43,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +33: [2023-04-29 11:26:43,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 8: [2023-04-29 11:26:43,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +26: [2023-04-29 11:26:43,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 5: [2023-04-29 11:26:43,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +18: [2023-04-29 11:26:43,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +18: [2023-04-29 11:26:43,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +49: [2023-04-29 11:26:43,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt... +18: [2023-04-29 11:26:43,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +18: [2023-04-29 11:26:43,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 4: [2023-04-29 11:26:43,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 1: [2023-04-29 11:26:43,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +47: [2023-04-29 11:26:43,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +31: [2023-04-29 11:26:43,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +31: [2023-04-29 11:26:43,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +31: [2023-04-29 11:26:43,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +44: [2023-04-29 11:26:43,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +44: [2023-04-29 11:26:43,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +47: [2023-04-29 11:26:43,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +13: [2023-04-29 11:26:43,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +31: [2023-04-29 11:26:43,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 3: [2023-04-29 11:26:43,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 3: [2023-04-29 11:26:43,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... + 3: [2023-04-29 11:26:43,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +52: [2023-04-29 11:26:43,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +52: [2023-04-29 11:26:43,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +47: [2023-04-29 11:26:43,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 5: [2023-04-29 11:26:43,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +37: [2023-04-29 11:26:43,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +37: [2023-04-29 11:26:43,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +37: [2023-04-29 11:26:43,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +14: [2023-04-29 11:26:43,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +52: [2023-04-29 11:26:43,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +37: [2023-04-29 11:26:43,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +13: [2023-04-29 11:26:43,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +52: [2023-04-29 11:26:43,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +50: [2023-04-29 11:26:43,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +50: [2023-04-29 11:26:43,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +50: [2023-04-29 11:26:43,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +50: [2023-04-29 11:26:43,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +18: [2023-04-29 11:26:43,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +18: [2023-04-29 11:26:43,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +18: [2023-04-29 11:26:43,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +18: [2023-04-29 11:26:43,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +21: [2023-04-29 11:26:43,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +47: [2023-04-29 11:26:43,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +24: [2023-04-29 11:26:43,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +24: [2023-04-29 11:26:43,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 5: [2023-04-29 11:26:43,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 9: [2023-04-29 11:26:43,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 5: [2023-04-29 11:26:43,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +24: [2023-04-29 11:26:43,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +33: [2023-04-29 11:26:43,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 9: [2023-04-29 11:26:43,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +63: [2023-04-29 11:26:43,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +24: [2023-04-29 11:26:43,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +37: [2023-04-29 11:26:43,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 11:26:43,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 11:26:43,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 11:26:43,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 11:26:43,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +37: [2023-04-29 11:26:43,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +37: [2023-04-29 11:26:43,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 5: [2023-04-29 11:26:43,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +37: [2023-04-29 11:26:43,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 7: [2023-04-29 11:26:43,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +51: [2023-04-29 11:26:43,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +51: [2023-04-29 11:26:43,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +63: [2023-04-29 11:26:43,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +21: [2023-04-29 11:26:43,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +11: [2023-04-29 11:26:43,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +51: [2023-04-29 11:26:43,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +55: [2023-04-29 11:26:43,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +55: [2023-04-29 11:26:43,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +51: [2023-04-29 11:26:43,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +55: [2023-04-29 11:26:43,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +55: [2023-04-29 11:26:43,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +33: [2023-04-29 11:26:43,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +50: [2023-04-29 11:26:43,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +50: [2023-04-29 11:26:43,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 5: [2023-04-29 11:26:43,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +50: [2023-04-29 11:26:43,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +63: [2023-04-29 11:26:43,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... + 4: [2023-04-29 11:26:43,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 4: [2023-04-29 11:26:43,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +50: [2023-04-29 11:26:43,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 6: [2023-04-29 11:26:43,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 11:26:43,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +16: [2023-04-29 11:26:43,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +51: [2023-04-29 11:26:43,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +51: [2023-04-29 11:26:43,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +51: [2023-04-29 11:26:43,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +28: [2023-04-29 11:26:43,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +63: [2023-04-29 11:26:43,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +55: [2023-04-29 11:26:43,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +11: [2023-04-29 11:26:43,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +25: [2023-04-29 11:26:43,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +25: [2023-04-29 11:26:43,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +55: [2023-04-29 11:26:43,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 11:26:43,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +55: [2023-04-29 11:26:43,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 8: [2023-04-29 11:26:43,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 8: [2023-04-29 11:26:43,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 8: [2023-04-29 11:26:43,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +25: [2023-04-29 11:26:43,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 11:26:43,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +25: [2023-04-29 11:26:43,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +33: [2023-04-29 11:26:43,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +11: [2023-04-29 11:26:43,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt... +28: [2023-04-29 11:26:43,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +28: [2023-04-29 11:26:43,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 6: [2023-04-29 11:26:43,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 6: [2023-04-29 11:26:43,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +25: [2023-04-29 11:26:43,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +21: [2023-04-29 11:26:43,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +29: [2023-04-29 11:26:43,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +29: [2023-04-29 11:26:43,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +29: [2023-04-29 11:26:43,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +25: [2023-04-29 11:26:43,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +17: [2023-04-29 11:26:43,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +29: [2023-04-29 11:26:43,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +25: [2023-04-29 11:26:43,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +25: [2023-04-29 11:26:43,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +33: [2023-04-29 11:26:43,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +28: [2023-04-29 11:26:43,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +28: [2023-04-29 11:26:43,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +28: [2023-04-29 11:26:43,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +21: [2023-04-29 11:26:43,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 11:26:43,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 11:26:43,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +21: [2023-04-29 11:26:43,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +38: [2023-04-29 11:26:43,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +38: [2023-04-29 11:26:43,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +38: [2023-04-29 11:26:43,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +53: [2023-04-29 11:26:43,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +62: [2023-04-29 11:26:43,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +27: [2023-04-29 11:26:43,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +27: [2023-04-29 11:26:43,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +27: [2023-04-29 11:26:43,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +38: [2023-04-29 11:26:43,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +17: [2023-04-29 11:26:43,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 11:26:43,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +41: [2023-04-29 11:26:43,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +41: [2023-04-29 11:26:43,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +17: [2023-04-29 11:26:43,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +33: [2023-04-29 11:26:43,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +41: [2023-04-29 11:26:43,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +33: [2023-04-29 11:26:43,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +33: [2023-04-29 11:26:43,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +16: [2023-04-29 11:26:43,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +29: [2023-04-29 11:26:43,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +41: [2023-04-29 11:26:43,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +33: [2023-04-29 11:26:43,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +29: [2023-04-29 11:26:43,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +21: [2023-04-29 11:26:43,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +28: [2023-04-29 11:26:43,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +28: [2023-04-29 11:26:43,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 3: [2023-04-29 11:26:43,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 11:26:43,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +29: [2023-04-29 11:26:43,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +29: [2023-04-29 11:26:43,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +62: [2023-04-29 11:26:43,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +53: [2023-04-29 11:26:43,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +30: [2023-04-29 11:26:43,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +30: [2023-04-29 11:26:43,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +38: [2023-04-29 11:26:43,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +24: [2023-04-29 11:26:43,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +38: [2023-04-29 11:26:43,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +41: [2023-04-29 11:26:43,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +41: [2023-04-29 11:26:43,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +38: [2023-04-29 11:26:43,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +38: [2023-04-29 11:26:43,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +21: [2023-04-29 11:26:43,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +21: [2023-04-29 11:26:43,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 3: [2023-04-29 11:26:43,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +41: [2023-04-29 11:26:43,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +41: [2023-04-29 11:26:43,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +30: [2023-04-29 11:26:43,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 11:26:43,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +17: [2023-04-29 11:26:43,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 11:26:43,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +17: [2023-04-29 11:26:43,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 2: [2023-04-29 11:26:43,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +24: [2023-04-29 11:26:43,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +33: [2023-04-29 11:26:43,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +60: [2023-04-29 11:26:43,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +60: [2023-04-29 11:26:43,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +60: [2023-04-29 11:26:43,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +17: [2023-04-29 11:26:43,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +60: [2023-04-29 11:26:43,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 0: [2023-04-29 11:26:43,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +24: [2023-04-29 11:26:43,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 0: [2023-04-29 11:26:43,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +27: [2023-04-29 11:26:43,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +30: [2023-04-29 11:26:43,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +30: [2023-04-29 11:26:43,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +22: [2023-04-29 11:26:43,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 11:26:43,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +24: [2023-04-29 11:26:43,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +53: [2023-04-29 11:26:43,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +30: [2023-04-29 11:26:43,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +62: [2023-04-29 11:26:43,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +17: [2023-04-29 11:26:43,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +16: [2023-04-29 11:26:43,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +60: [2023-04-29 11:26:43,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +33: [2023-04-29 11:26:43,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +16: [2023-04-29 11:26:43,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +62: [2023-04-29 11:26:43,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +22: [2023-04-29 11:26:43,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 11:26:43,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +53: [2023-04-29 11:26:43,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +53: [2023-04-29 11:26:43,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... + 0: [2023-04-29 11:26:43,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 0: [2023-04-29 11:26:43,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 11:26:43,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +60: [2023-04-29 11:26:43,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +22: [2023-04-29 11:26:43,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +62: [2023-04-29 11:26:43,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +62: [2023-04-29 11:26:43,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +30: [2023-04-29 11:26:43,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +26: [2023-04-29 11:26:43,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +26: [2023-04-29 11:26:43,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +60: [2023-04-29 11:26:43,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +60: [2023-04-29 11:26:43,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +22: [2023-04-29 11:26:43,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 3: [2023-04-29 11:26:43,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 5: [2023-04-29 11:26:43,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 5: [2023-04-29 11:26:43,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +26: [2023-04-29 11:26:43,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +62: [2023-04-29 11:26:43,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... + 3: [2023-04-29 11:26:43,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +27: [2023-04-29 11:26:43,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +53: [2023-04-29 11:26:43,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +53: [2023-04-29 11:26:43,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +62: [2023-04-29 11:26:43,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +10: [2023-04-29 11:26:43,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +30: [2023-04-29 11:26:43,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +27: [2023-04-29 11:26:43,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +13: [2023-04-29 11:26:43,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 11:26:43,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 11:26:43,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +15: [2023-04-29 11:26:43,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 1: [2023-04-29 11:26:43,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 1: [2023-04-29 11:26:43,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 1: [2023-04-29 11:26:43,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 11:26:43,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 1: [2023-04-29 11:26:43,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +15: [2023-04-29 11:26:43,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +26: [2023-04-29 11:26:43,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +10: [2023-04-29 11:26:43,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +54: [2023-04-29 11:26:43,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +54: [2023-04-29 11:26:43,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +47: [2023-04-29 11:26:43,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +29: [2023-04-29 11:26:43,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 5: [2023-04-29 11:26:43,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 11:26:43,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +39: [2023-04-29 11:26:43,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 11:26:43,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +49: [2023-04-29 11:26:43,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. + 5: [2023-04-29 11:26:43,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +15: [2023-04-29 11:26:43,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +15: [2023-04-29 11:26:43,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +54: [2023-04-29 11:26:43,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 3: [2023-04-29 11:26:43,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +54: [2023-04-29 11:26:43,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +21: [2023-04-29 11:26:43,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +21: [2023-04-29 11:26:43,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +21: [2023-04-29 11:26:43,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 1: [2023-04-29 11:26:43,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +12: [2023-04-29 11:26:43,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +12: [2023-04-29 11:26:43,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +12: [2023-04-29 11:26:43,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 1: [2023-04-29 11:26:43,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +12: [2023-04-29 11:26:43,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +33: [2023-04-29 11:26:43,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 1: [2023-04-29 11:26:43,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +27: [2023-04-29 11:26:43,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +27: [2023-04-29 11:26:43,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 6: [2023-04-29 11:26:43,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 1: [2023-04-29 11:26:43,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +27: [2023-04-29 11:26:43,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +27: [2023-04-29 11:26:43,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +31: [2023-04-29 11:26:43,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +31: [2023-04-29 11:26:43,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +39: [2023-04-29 11:26:43,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 11:26:43,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +10: [2023-04-29 11:26:43,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 11:26:43,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +39: [2023-04-29 11:26:43,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +39: [2023-04-29 11:26:43,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +31: [2023-04-29 11:26:43,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +29: [2023-04-29 11:26:43,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +31: [2023-04-29 11:26:43,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +33: [2023-04-29 11:26:43,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +54: [2023-04-29 11:26:43,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +54: [2023-04-29 11:26:43,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +33: [2023-04-29 11:26:43,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +27: [2023-04-29 11:26:43,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +49: [2023-04-29 11:26:43,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +33: [2023-04-29 11:26:43,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +21: [2023-04-29 11:26:43,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 11:26:43,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +33: [2023-04-29 11:26:43,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +10: [2023-04-29 11:26:43,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 7: [2023-04-29 11:26:43,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +27: [2023-04-29 11:26:43,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +12: [2023-04-29 11:26:43,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 0: [2023-04-29 11:26:43,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +12: [2023-04-29 11:26:43,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +54: [2023-04-29 11:26:43,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +54: [2023-04-29 11:26:43,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +12: [2023-04-29 11:26:43,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +12: [2023-04-29 11:26:43,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +13: [2023-04-29 11:26:43,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 7: [2023-04-29 11:26:43,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 9: [2023-04-29 11:26:43,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 11:26:43,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +16: [2023-04-29 11:26:43,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +29: [2023-04-29 11:26:43,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +22: [2023-04-29 11:26:43,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 3: [2023-04-29 11:26:43,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +53: [2023-04-29 11:26:43,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +49: [2023-04-29 11:26:43,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +16: [2023-04-29 11:26:43,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +16: [2023-04-29 11:26:43,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +16: [2023-04-29 11:26:43,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 0: [2023-04-29 11:26:43,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +27: [2023-04-29 11:26:43,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +27: [2023-04-29 11:26:43,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +49: [2023-04-29 11:26:43,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +29: [2023-04-29 11:26:43,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +31: [2023-04-29 11:26:43,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +31: [2023-04-29 11:26:43,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +31: [2023-04-29 11:26:43,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +27: [2023-04-29 11:26:43,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +16: [2023-04-29 11:26:43,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +29: [2023-04-29 11:26:43,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 2: [2023-04-29 11:26:43,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 3: [2023-04-29 11:26:43,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +24: [2023-04-29 11:26:43,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +24: [2023-04-29 11:26:43,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +52: [2023-04-29 11:26:43,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +18: [2023-04-29 11:26:43,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +55: [2023-04-29 11:26:43,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 0: [2023-04-29 11:26:43,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +29: [2023-04-29 11:26:43,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. + 0: [2023-04-29 11:26:43,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +53: [2023-04-29 11:26:43,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 11:26:43,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +16: [2023-04-29 11:26:43,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +49: [2023-04-29 11:26:43,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +37: [2023-04-29 11:26:43,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +37: [2023-04-29 11:26:43,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 5: [2023-04-29 11:26:43,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 2: [2023-04-29 11:26:43,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 5: [2023-04-29 11:26:43,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +27: [2023-04-29 11:26:43,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +49: [2023-04-29 11:26:43,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_00-model_states.pt. +16: [2023-04-29 11:26:43,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +13: [2023-04-29 11:26:43,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +47: [2023-04-29 11:26:43,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +26: [2023-04-29 11:26:43,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +47: [2023-04-29 11:26:43,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +16: [2023-04-29 11:26:43,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +18: [2023-04-29 11:26:43,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +10: [2023-04-29 11:26:43,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +24: [2023-04-29 11:26:43,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +24: [2023-04-29 11:26:43,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +49: [2023-04-29 11:26:43,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +11: [2023-04-29 11:26:43,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +47: [2023-04-29 11:26:43,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +24: [2023-04-29 11:26:43,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +24: [2023-04-29 11:26:43,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +53: [2023-04-29 11:26:43,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +29: [2023-04-29 11:26:43,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +26: [2023-04-29 11:26:43,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +22: [2023-04-29 11:26:43,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +26: [2023-04-29 11:26:43,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +51: [2023-04-29 11:26:43,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +10: [2023-04-29 11:26:43,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +22: [2023-04-29 11:26:43,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 7: [2023-04-29 11:26:43,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +52: [2023-04-29 11:26:43,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +47: [2023-04-29 11:26:43,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +18: [2023-04-29 11:26:43,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +18: [2023-04-29 11:26:43,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +15: [2023-04-29 11:26:43,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 3: [2023-04-29 11:26:43,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +55: [2023-04-29 11:26:43,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +52: [2023-04-29 11:26:43,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +52: [2023-04-29 11:26:43,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +22: [2023-04-29 11:26:43,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 3: [2023-04-29 11:26:43,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +13: [2023-04-29 11:26:43,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 11:26:43,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +37: [2023-04-29 11:26:43,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +37: [2023-04-29 11:26:43,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +53: [2023-04-29 11:26:43,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 11:26:43,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +49: [2023-04-29 11:26:43,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt... +24: [2023-04-29 11:26:43,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +15: [2023-04-29 11:26:43,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +15: [2023-04-29 11:26:43,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +39: [2023-04-29 11:26:43,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +24: [2023-04-29 11:26:43,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +50: [2023-04-29 11:26:43,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 5: [2023-04-29 11:26:43,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +13: [2023-04-29 11:26:43,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +55: [2023-04-29 11:26:43,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 9: [2023-04-29 11:26:43,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 11:26:43,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +29: [2023-04-29 11:26:43,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 3: [2023-04-29 11:26:43,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +31: [2023-04-29 11:26:43,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +21: [2023-04-29 11:26:43,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 3: [2023-04-29 11:26:43,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +26: [2023-04-29 11:26:43,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +25: [2023-04-29 11:26:43,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +15: [2023-04-29 11:26:43,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 5: [2023-04-29 11:26:43,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 6: [2023-04-29 11:26:43,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +51: [2023-04-29 11:26:43,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +51: [2023-04-29 11:26:43,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +51: [2023-04-29 11:26:43,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +11: [2023-04-29 11:26:43,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +21: [2023-04-29 11:26:43,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +38: [2023-04-29 11:26:43,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +50: [2023-04-29 11:26:43,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... + 9: [2023-04-29 11:26:43,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +39: [2023-04-29 11:26:43,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +39: [2023-04-29 11:26:43,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +21: [2023-04-29 11:26:43,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +55: [2023-04-29 11:26:43,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +50: [2023-04-29 11:26:43,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +50: [2023-04-29 11:26:43,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 3: [2023-04-29 11:26:43,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... + 7: [2023-04-29 11:26:43,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +13: [2023-04-29 11:26:43,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +13: [2023-04-29 11:26:43,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +21: [2023-04-29 11:26:43,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +14: [2023-04-29 11:26:43,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +14: [2023-04-29 11:26:43,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 6: [2023-04-29 11:26:43,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +10: [2023-04-29 11:26:43,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 3: [2023-04-29 11:26:43,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +39: [2023-04-29 11:26:43,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +23: [2023-04-29 11:26:43,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +23: [2023-04-29 11:26:43,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 11:26:43,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +10: [2023-04-29 11:26:43,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +25: [2023-04-29 11:26:43,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +31: [2023-04-29 11:26:43,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +59: [2023-04-29 11:26:43,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +59: [2023-04-29 11:26:43,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +59: [2023-04-29 11:26:43,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +31: [2023-04-29 11:26:43,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +59: [2023-04-29 11:26:43,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +11: [2023-04-29 11:26:43,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 11:26:43,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +31: [2023-04-29 11:26:43,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 7: [2023-04-29 11:26:43,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +29: [2023-04-29 11:26:43,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +29: [2023-04-29 11:26:43,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +18: [2023-04-29 11:26:43,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +14: [2023-04-29 11:26:43,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +14: [2023-04-29 11:26:43,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +23: [2023-04-29 11:26:43,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +41: [2023-04-29 11:26:43,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +31: [2023-04-29 11:26:43,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 3: [2023-04-29 11:26:43,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +23: [2023-04-29 11:26:43,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 11:26:43,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +13: [2023-04-29 11:26:43,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +14: [2023-04-29 11:26:43,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +52: [2023-04-29 11:26:43,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 7: [2023-04-29 11:26:43,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +14: [2023-04-29 11:26:43,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 7: [2023-04-29 11:26:43,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +17: [2023-04-29 11:26:43,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 11:26:43,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +25: [2023-04-29 11:26:43,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 9: [2023-04-29 11:26:43,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 9: [2023-04-29 11:26:43,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +37: [2023-04-29 11:26:43,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +37: [2023-04-29 11:26:43,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +31: [2023-04-29 11:26:43,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +38: [2023-04-29 11:26:43,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 3: [2023-04-29 11:26:43,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +25: [2023-04-29 11:26:43,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +51: [2023-04-29 11:26:43,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +60: [2023-04-29 11:26:43,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +41: [2023-04-29 11:26:43,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +53: [2023-04-29 11:26:43,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +11: [2023-04-29 11:26:43,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 11:26:43,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 3: [2023-04-29 11:26:43,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +59: [2023-04-29 11:26:43,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +55: [2023-04-29 11:26:43,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +53: [2023-04-29 11:26:43,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +24: [2023-04-29 11:26:43,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +23: [2023-04-29 11:26:43,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 7: [2023-04-29 11:26:43,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 11:26:43,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +38: [2023-04-29 11:26:43,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +38: [2023-04-29 11:26:43,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +59: [2023-04-29 11:26:43,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +18: [2023-04-29 11:26:43,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +14: [2023-04-29 11:26:43,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +23: [2023-04-29 11:26:43,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +31: [2023-04-29 11:26:43,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +31: [2023-04-29 11:26:43,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +23: [2023-04-29 11:26:43,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 11:26:43,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +14: [2023-04-29 11:26:43,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +41: [2023-04-29 11:26:43,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +41: [2023-04-29 11:26:43,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +59: [2023-04-29 11:26:43,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +59: [2023-04-29 11:26:43,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 11:26:43,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +56: [2023-04-29 11:26:43,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +56: [2023-04-29 11:26:43,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +20: [2023-04-29 11:26:43,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +20: [2023-04-29 11:26:43,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 9: [2023-04-29 11:26:43,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... + 7: [2023-04-29 11:26:43,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +18: [2023-04-29 11:26:43,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +29: [2023-04-29 11:26:43,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +29: [2023-04-29 11:26:43,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 11:26:43,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +24: [2023-04-29 11:26:43,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +18: [2023-04-29 11:26:43,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +20: [2023-04-29 11:26:43,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +23: [2023-04-29 11:26:43,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +17: [2023-04-29 11:26:43,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +20: [2023-04-29 11:26:43,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +52: [2023-04-29 11:26:43,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +56: [2023-04-29 11:26:43,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +56: [2023-04-29 11:26:43,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +37: [2023-04-29 11:26:43,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +37: [2023-04-29 11:26:43,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +55: [2023-04-29 11:26:43,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +52: [2023-04-29 11:26:43,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +47: [2023-04-29 11:26:43,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +47: [2023-04-29 11:26:43,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 7: [2023-04-29 11:26:43,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +47: [2023-04-29 11:26:43,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +25: [2023-04-29 11:26:43,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +56: [2023-04-29 11:26:43,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +56: [2023-04-29 11:26:43,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +38: [2023-04-29 11:26:43,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +20: [2023-04-29 11:26:43,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +20: [2023-04-29 11:26:43,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +56: [2023-04-29 11:26:43,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +20: [2023-04-29 11:26:43,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +50: [2023-04-29 11:26:43,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +56: [2023-04-29 11:26:43,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +20: [2023-04-29 11:26:43,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +31: [2023-04-29 11:26:43,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +51: [2023-04-29 11:26:43,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +33: [2023-04-29 11:26:43,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +60: [2023-04-29 11:26:43,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +51: [2023-04-29 11:26:43,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +60: [2023-04-29 11:26:43,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +60: [2023-04-29 11:26:43,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 1: [2023-04-29 11:26:43,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +62: [2023-04-29 11:26:43,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +62: [2023-04-29 11:26:43,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +62: [2023-04-29 11:26:43,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +51: [2023-04-29 11:26:43,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +62: [2023-04-29 11:26:43,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +29: [2023-04-29 11:26:43,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +11: [2023-04-29 11:26:43,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +29: [2023-04-29 11:26:43,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +55: [2023-04-29 11:26:43,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +15: [2023-04-29 11:26:43,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +15: [2023-04-29 11:26:43,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +15: [2023-04-29 11:26:43,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +15: [2023-04-29 11:26:43,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +41: [2023-04-29 11:26:43,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +24: [2023-04-29 11:26:43,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +24: [2023-04-29 11:26:43,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +24: [2023-04-29 11:26:43,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +60: [2023-04-29 11:26:43,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +60: [2023-04-29 11:26:43,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +60: [2023-04-29 11:26:43,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +33: [2023-04-29 11:26:43,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +33: [2023-04-29 11:26:43,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +60: [2023-04-29 11:26:43,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +25: [2023-04-29 11:26:43,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +50: [2023-04-29 11:26:43,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +33: [2023-04-29 11:26:43,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +11: [2023-04-29 11:26:43,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +11: [2023-04-29 11:26:43,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_00-model_states.pt. +17: [2023-04-29 11:26:43,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +62: [2023-04-29 11:26:43,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +60: [2023-04-29 11:26:43,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +62: [2023-04-29 11:26:43,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +62: [2023-04-29 11:26:43,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +62: [2023-04-29 11:26:43,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +12: [2023-04-29 11:26:43,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +12: [2023-04-29 11:26:43,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +38: [2023-04-29 11:26:43,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +33: [2023-04-29 11:26:43,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... + 1: [2023-04-29 11:26:43,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 1: [2023-04-29 11:26:43,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 1: [2023-04-29 11:26:43,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +54: [2023-04-29 11:26:43,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +25: [2023-04-29 11:26:43,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +33: [2023-04-29 11:26:43,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +11: [2023-04-29 11:26:43,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +25: [2023-04-29 11:26:43,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +24: [2023-04-29 11:26:43,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +24: [2023-04-29 11:26:43,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +50: [2023-04-29 11:26:43,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +12: [2023-04-29 11:26:43,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +12: [2023-04-29 11:26:43,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +50: [2023-04-29 11:26:43,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +24: [2023-04-29 11:26:43,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +17: [2023-04-29 11:26:43,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +54: [2023-04-29 11:26:43,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +38: [2023-04-29 11:26:43,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +38: [2023-04-29 11:26:43,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +11: [2023-04-29 11:26:43,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +54: [2023-04-29 11:26:43,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +54: [2023-04-29 11:26:43,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +11: [2023-04-29 11:26:43,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +41: [2023-04-29 11:26:43,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +11: [2023-04-29 11:26:43,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +33: [2023-04-29 11:26:43,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +11: [2023-04-29 11:26:43,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt... +29: [2023-04-29 11:26:43,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +41: [2023-04-29 11:26:43,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 11:26:43,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +11: [2023-04-29 11:26:43,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +29: [2023-04-29 11:26:43,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +17: [2023-04-29 11:26:43,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +20: [2023-04-29 11:26:43,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +20: [2023-04-29 11:26:43,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +20: [2023-04-29 11:26:43,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +20: [2023-04-29 11:26:43,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +33: [2023-04-29 11:26:43,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... + 7: [2023-04-29 11:26:43,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +24: [2023-04-29 11:26:43,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +24: [2023-04-29 11:26:43,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 11:26:43,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 7: [2023-04-29 11:26:43,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 7: [2023-04-29 11:26:43,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 1: [2023-04-29 11:26:43,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +15: [2023-04-29 11:26:43,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +60: [2023-04-29 11:26:43,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +60: [2023-04-29 11:26:43,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +15: [2023-04-29 11:26:43,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 0: [2023-04-29 11:26:43,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 0: [2023-04-29 11:26:43,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 0: [2023-04-29 11:26:43,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 0: [2023-04-29 11:26:43,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +15: [2023-04-29 11:26:43,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +15: [2023-04-29 11:26:43,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 8: [2023-04-29 11:26:43,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 8: [2023-04-29 11:26:43,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 8: [2023-04-29 11:26:43,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +54: [2023-04-29 11:26:43,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 8: [2023-04-29 11:26:43,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +54: [2023-04-29 11:26:43,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +60: [2023-04-29 11:26:43,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 1: [2023-04-29 11:26:43,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +60: [2023-04-29 11:26:43,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +60: [2023-04-29 11:26:43,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +60: [2023-04-29 11:26:43,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 1: [2023-04-29 11:26:43,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 1: [2023-04-29 11:26:43,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +12: [2023-04-29 11:26:43,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +12: [2023-04-29 11:26:43,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +12: [2023-04-29 11:26:43,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +60: [2023-04-29 11:26:43,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +54: [2023-04-29 11:26:43,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +54: [2023-04-29 11:26:43,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +12: [2023-04-29 11:26:43,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +36: [2023-04-29 11:26:43,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +24: [2023-04-29 11:26:43,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +31: [2023-04-29 11:26:43,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +36: [2023-04-29 11:26:43,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +36: [2023-04-29 11:26:43,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +36: [2023-04-29 11:26:43,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +61: [2023-04-29 11:26:43,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +61: [2023-04-29 11:26:43,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +24: [2023-04-29 11:26:43,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +61: [2023-04-29 11:26:43,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +61: [2023-04-29 11:26:43,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 11:26:43,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 11:26:43,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +36: [2023-04-29 11:26:43,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +43: [2023-04-29 11:26:43,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +43: [2023-04-29 11:26:43,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +61: [2023-04-29 11:26:43,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +31: [2023-04-29 11:26:43,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +24: [2023-04-29 11:26:43,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +61: [2023-04-29 11:26:43,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 7: [2023-04-29 11:26:43,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +43: [2023-04-29 11:26:43,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +36: [2023-04-29 11:26:43,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +36: [2023-04-29 11:26:43,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +61: [2023-04-29 11:26:43,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +36: [2023-04-29 11:26:43,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +20: [2023-04-29 11:26:43,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +43: [2023-04-29 11:26:43,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +61: [2023-04-29 11:26:43,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +20: [2023-04-29 11:26:43,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +24: [2023-04-29 11:26:43,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +14: [2023-04-29 11:26:43,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +14: [2023-04-29 11:26:43,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +43: [2023-04-29 11:26:43,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +43: [2023-04-29 11:26:43,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +31: [2023-04-29 11:26:43,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +31: [2023-04-29 11:26:43,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +41: [2023-04-29 11:26:43,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +41: [2023-04-29 11:26:43,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +41: [2023-04-29 11:26:43,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +41: [2023-04-29 11:26:43,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +31: [2023-04-29 11:26:43,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +43: [2023-04-29 11:26:43,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +43: [2023-04-29 11:26:43,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +43: [2023-04-29 11:26:43,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +23: [2023-04-29 11:26:43,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +23: [2023-04-29 11:26:43,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +43: [2023-04-29 11:26:43,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +23: [2023-04-29 11:26:43,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +20: [2023-04-29 11:26:43,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +52: [2023-04-29 11:26:43,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +52: [2023-04-29 11:26:43,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +52: [2023-04-29 11:26:43,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +52: [2023-04-29 11:26:43,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +20: [2023-04-29 11:26:43,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +14: [2023-04-29 11:26:43,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +28: [2023-04-29 11:26:43,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +56: [2023-04-29 11:26:43,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +59: [2023-04-29 11:26:43,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +59: [2023-04-29 11:26:43,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +59: [2023-04-29 11:26:43,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +28: [2023-04-29 11:26:43,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +28: [2023-04-29 11:26:43,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +28: [2023-04-29 11:26:43,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +31: [2023-04-29 11:26:43,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... + 0: [2023-04-29 11:26:43,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +56: [2023-04-29 11:26:43,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +31: [2023-04-29 11:26:43,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +31: [2023-04-29 11:26:43,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... + 7: [2023-04-29 11:26:43,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +14: [2023-04-29 11:26:43,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +56: [2023-04-29 11:26:43,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 11:26:43,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +32: [2023-04-29 11:26:43,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +32: [2023-04-29 11:26:43,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +45: [2023-04-29 11:26:43,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 11:26:43,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +45: [2023-04-29 11:26:43,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 11:26:43,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 0: [2023-04-29 11:26:43,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +56: [2023-04-29 11:26:43,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 11:26:43,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +28: [2023-04-29 11:26:43,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 0: [2023-04-29 11:26:43,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 0: [2023-04-29 11:26:43,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 8: [2023-04-29 11:26:43,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +23: [2023-04-29 11:26:43,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +59: [2023-04-29 11:26:43,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 8: [2023-04-29 11:26:43,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +28: [2023-04-29 11:26:43,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 7: [2023-04-29 11:26:43,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... + 8: [2023-04-29 11:26:43,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 8: [2023-04-29 11:26:43,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +28: [2023-04-29 11:26:43,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +45: [2023-04-29 11:26:43,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +28: [2023-04-29 11:26:43,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +45: [2023-04-29 11:26:43,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +62: [2023-04-29 11:26:43,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +45: [2023-04-29 11:26:43,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +45: [2023-04-29 11:26:43,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +32: [2023-04-29 11:26:43,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +32: [2023-04-29 11:26:43,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +24: [2023-04-29 11:26:43,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +24: [2023-04-29 11:26:43,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +32: [2023-04-29 11:26:43,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +32: [2023-04-29 11:26:43,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +58: [2023-04-29 11:26:43,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +58: [2023-04-29 11:26:43,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +58: [2023-04-29 11:26:43,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +20: [2023-04-29 11:26:43,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +49: [2023-04-29 11:26:43,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +49: [2023-04-29 11:26:43,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +58: [2023-04-29 11:26:43,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +42: [2023-04-29 11:26:43,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +42: [2023-04-29 11:26:43,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +42: [2023-04-29 11:26:43,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +42: [2023-04-29 11:26:43,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +49: [2023-04-29 11:26:43,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +49: [2023-04-29 11:26:43,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +20: [2023-04-29 11:26:43,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +62: [2023-04-29 11:26:43,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +58: [2023-04-29 11:26:43,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +58: [2023-04-29 11:26:43,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +58: [2023-04-29 11:26:43,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +62: [2023-04-29 11:26:43,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +58: [2023-04-29 11:26:43,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +42: [2023-04-29 11:26:43,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +48: [2023-04-29 11:26:43,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +48: [2023-04-29 11:26:43,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +49: [2023-04-29 11:26:43,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 7: [2023-04-29 11:26:43,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +42: [2023-04-29 11:26:43,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +20: [2023-04-29 11:26:43,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +20: [2023-04-29 11:26:43,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +41: [2023-04-29 11:26:43,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +49: [2023-04-29 11:26:43,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +62: [2023-04-29 11:26:43,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +41: [2023-04-29 11:26:43,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 11:26:43,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 11:26:43,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +49: [2023-04-29 11:26:43,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +42: [2023-04-29 11:26:43,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +42: [2023-04-29 11:26:43,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +43: [2023-04-29 11:26:43,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +43: [2023-04-29 11:26:43,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 11:26:43,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +41: [2023-04-29 11:26:43,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 11:26:43,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +48: [2023-04-29 11:26:43,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +48: [2023-04-29 11:26:43,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 11:26:43,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +14: [2023-04-29 11:26:43,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +14: [2023-04-29 11:26:43,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +49: [2023-04-29 11:26:43,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +56: [2023-04-29 11:26:43,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +48: [2023-04-29 11:26:43,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +48: [2023-04-29 11:26:43,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +60: [2023-04-29 11:26:43,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 11:26:43,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +56: [2023-04-29 11:26:43,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 11:26:43,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +44: [2023-04-29 11:26:43,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +44: [2023-04-29 11:26:43,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +44: [2023-04-29 11:26:43,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +44: [2023-04-29 11:26:43,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +23: [2023-04-29 11:26:43,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +59: [2023-04-29 11:26:43,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +56: [2023-04-29 11:26:43,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +56: [2023-04-29 11:26:43,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +48: [2023-04-29 11:26:43,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +60: [2023-04-29 11:26:43,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +46: [2023-04-29 11:26:43,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +46: [2023-04-29 11:26:43,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +46: [2023-04-29 11:26:43,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +15: [2023-04-29 11:26:43,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +62: [2023-04-29 11:26:43,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +46: [2023-04-29 11:26:43,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +48: [2023-04-29 11:26:43,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +23: [2023-04-29 11:26:43,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +44: [2023-04-29 11:26:43,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +23: [2023-04-29 11:26:43,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +59: [2023-04-29 11:26:43,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +60: [2023-04-29 11:26:43,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +44: [2023-04-29 11:26:43,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +44: [2023-04-29 11:26:43,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +14: [2023-04-29 11:26:43,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +14: [2023-04-29 11:26:43,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +44: [2023-04-29 11:26:43,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +46: [2023-04-29 11:26:43,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +46: [2023-04-29 11:26:43,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +46: [2023-04-29 11:26:43,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +40: [2023-04-29 11:26:43,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +59: [2023-04-29 11:26:43,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +40: [2023-04-29 11:26:43,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +40: [2023-04-29 11:26:43,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +46: [2023-04-29 11:26:43,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +40: [2023-04-29 11:26:43,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +15: [2023-04-29 11:26:43,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +60: [2023-04-29 11:26:43,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +60: [2023-04-29 11:26:43,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +36: [2023-04-29 11:26:43,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +40: [2023-04-29 11:26:43,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +40: [2023-04-29 11:26:43,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +59: [2023-04-29 11:26:43,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +60: [2023-04-29 11:26:43,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +40: [2023-04-29 11:26:43,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +15: [2023-04-29 11:26:43,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +40: [2023-04-29 11:26:43,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +63: [2023-04-29 11:26:43,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +63: [2023-04-29 11:26:43,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +63: [2023-04-29 11:26:43,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +63: [2023-04-29 11:26:43,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +20: [2023-04-29 11:26:43,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +15: [2023-04-29 11:26:43,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +15: [2023-04-29 11:26:43,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +57: [2023-04-29 11:26:43,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +57: [2023-04-29 11:26:43,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +23: [2023-04-29 11:26:43,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +62: [2023-04-29 11:26:43,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +20: [2023-04-29 11:26:43,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +57: [2023-04-29 11:26:43,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +57: [2023-04-29 11:26:43,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +35: [2023-04-29 11:26:43,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +35: [2023-04-29 11:26:43,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +62: [2023-04-29 11:26:43,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +15: [2023-04-29 11:26:43,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +60: [2023-04-29 11:26:43,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 11:26:43,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +54: [2023-04-29 11:26:43,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +54: [2023-04-29 11:26:43,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +57: [2023-04-29 11:26:43,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +15: [2023-04-29 11:26:43,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +57: [2023-04-29 11:26:43,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +35: [2023-04-29 11:26:43,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +15: [2023-04-29 11:26:43,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +54: [2023-04-29 11:26:43,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +62: [2023-04-29 11:26:43,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +54: [2023-04-29 11:26:43,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +35: [2023-04-29 11:26:43,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 11:26:43,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +63: [2023-04-29 11:26:43,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +63: [2023-04-29 11:26:43,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +20: [2023-04-29 11:26:43,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +35: [2023-04-29 11:26:43,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +60: [2023-04-29 11:26:43,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +61: [2023-04-29 11:26:43,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +61: [2023-04-29 11:26:43,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +57: [2023-04-29 11:26:43,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +57: [2023-04-29 11:26:43,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +20: [2023-04-29 11:26:43,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +35: [2023-04-29 11:26:43,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +35: [2023-04-29 11:26:43,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +43: [2023-04-29 11:26:43,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 11:26:43,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +61: [2023-04-29 11:26:43,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +61: [2023-04-29 11:26:43,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +35: [2023-04-29 11:26:43,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +36: [2023-04-29 11:26:43,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +36: [2023-04-29 11:26:43,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +36: [2023-04-29 11:26:43,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +45: [2023-04-29 11:26:43,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 8: [2023-04-29 11:26:43,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 0: [2023-04-29 11:26:43,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +36: [2023-04-29 11:26:43,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +45: [2023-04-29 11:26:43,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +28: [2023-04-29 11:26:43,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +51: [2023-04-29 11:26:43,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +51: [2023-04-29 11:26:43,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +51: [2023-04-29 11:26:43,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +20: [2023-04-29 11:26:43,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +51: [2023-04-29 11:26:43,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +18: [2023-04-29 11:26:43,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +20: [2023-04-29 11:26:43,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +18: [2023-04-29 11:26:43,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +18: [2023-04-29 11:26:43,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +18: [2023-04-29 11:26:43,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 8: [2023-04-29 11:26:43,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... + 0: [2023-04-29 11:26:43,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +45: [2023-04-29 11:26:43,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 11:26:43,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +20: [2023-04-29 11:26:43,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +28: [2023-04-29 11:26:43,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +20: [2023-04-29 11:26:43,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +43: [2023-04-29 11:26:43,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 8: [2023-04-29 11:26:43,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +49: [2023-04-29 11:26:43,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +28: [2023-04-29 11:26:43,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +43: [2023-04-29 11:26:43,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +54: [2023-04-29 11:26:43,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 0: [2023-04-29 11:26:43,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 0: [2023-04-29 11:26:43,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 0: [2023-04-29 11:26:43,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +41: [2023-04-29 11:26:43,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 8: [2023-04-29 11:26:43,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 8: [2023-04-29 11:26:43,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +54: [2023-04-29 11:26:43,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +52: [2023-04-29 11:26:43,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +42: [2023-04-29 11:26:43,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +54: [2023-04-29 11:26:43,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +28: [2023-04-29 11:26:43,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +54: [2023-04-29 11:26:43,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +41: [2023-04-29 11:26:43,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +41: [2023-04-29 11:26:43,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +41: [2023-04-29 11:26:43,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 8: [2023-04-29 11:26:43,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +20: [2023-04-29 11:26:43,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +20: [2023-04-29 11:26:43,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 0: [2023-04-29 11:26:43,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +61: [2023-04-29 11:26:43,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +61: [2023-04-29 11:26:43,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. + 0: [2023-04-29 11:26:43,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +43: [2023-04-29 11:26:43,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +49: [2023-04-29 11:26:43,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 0: [2023-04-29 11:26:43,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +52: [2023-04-29 11:26:43,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +58: [2023-04-29 11:26:43,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +61: [2023-04-29 11:26:43,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. + 8: [2023-04-29 11:26:43,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +61: [2023-04-29 11:26:43,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. + 8: [2023-04-29 11:26:43,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +41: [2023-04-29 11:26:43,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +41: [2023-04-29 11:26:43,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +61: [2023-04-29 11:26:43,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 11:26:43,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 11:26:43,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +58: [2023-04-29 11:26:43,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +58: [2023-04-29 11:26:43,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +58: [2023-04-29 11:26:43,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 11:26:43,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +61: [2023-04-29 11:26:43,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +52: [2023-04-29 11:26:43,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +36: [2023-04-29 11:26:43,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +48: [2023-04-29 11:26:43,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +28: [2023-04-29 11:26:43,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +32: [2023-04-29 11:26:43,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +32: [2023-04-29 11:26:43,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +32: [2023-04-29 11:26:43,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +20: [2023-04-29 11:26:43,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +23: [2023-04-29 11:26:43,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +23: [2023-04-29 11:26:43,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +23: [2023-04-29 11:26:43,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +23: [2023-04-29 11:26:43,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +20: [2023-04-29 11:26:43,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +36: [2023-04-29 11:26:43,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 11:26:43,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 11:26:43,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +61: [2023-04-29 11:26:43,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +61: [2023-04-29 11:26:43,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +49: [2023-04-29 11:26:43,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +36: [2023-04-29 11:26:43,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +48: [2023-04-29 11:26:43,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 11:26:43,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 11:26:43,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +44: [2023-04-29 11:26:43,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +52: [2023-04-29 11:26:43,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +52: [2023-04-29 11:26:43,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +52: [2023-04-29 11:26:43,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +18: [2023-04-29 11:26:43,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +51: [2023-04-29 11:26:43,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +51: [2023-04-29 11:26:43,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +32: [2023-04-29 11:26:43,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +18: [2023-04-29 11:26:43,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +18: [2023-04-29 11:26:43,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +46: [2023-04-29 11:26:43,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +18: [2023-04-29 11:26:43,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +45: [2023-04-29 11:26:43,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +28: [2023-04-29 11:26:43,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +42: [2023-04-29 11:26:43,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +44: [2023-04-29 11:26:43,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +44: [2023-04-29 11:26:43,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 11:26:43,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +49: [2023-04-29 11:26:43,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +41: [2023-04-29 11:26:43,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +44: [2023-04-29 11:26:43,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +48: [2023-04-29 11:26:43,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +48: [2023-04-29 11:26:43,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 11:26:43,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +42: [2023-04-29 11:26:43,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +52: [2023-04-29 11:26:43,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +52: [2023-04-29 11:26:43,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +45: [2023-04-29 11:26:43,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +19: [2023-04-29 11:26:43,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +19: [2023-04-29 11:26:43,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +43: [2023-04-29 11:26:43,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +19: [2023-04-29 11:26:43,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +19: [2023-04-29 11:26:43,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +46: [2023-04-29 11:26:43,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 11:26:43,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +43: [2023-04-29 11:26:43,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +40: [2023-04-29 11:26:43,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +46: [2023-04-29 11:26:43,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +46: [2023-04-29 11:26:43,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +41: [2023-04-29 11:26:43,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +28: [2023-04-29 11:26:43,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +49: [2023-04-29 11:26:43,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +28: [2023-04-29 11:26:43,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +40: [2023-04-29 11:26:43,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +42: [2023-04-29 11:26:43,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +43: [2023-04-29 11:26:43,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +43: [2023-04-29 11:26:43,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +34: [2023-04-29 11:26:43,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +34: [2023-04-29 11:26:43,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +40: [2023-04-29 11:26:43,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +40: [2023-04-29 11:26:43,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +42: [2023-04-29 11:26:43,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +63: [2023-04-29 11:26:43,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 11:26:43,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +61: [2023-04-29 11:26:43,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +58: [2023-04-29 11:26:43,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +43: [2023-04-29 11:26:43,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +34: [2023-04-29 11:26:43,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +61: [2023-04-29 11:26:43,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +58: [2023-04-29 11:26:43,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +34: [2023-04-29 11:26:43,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +58: [2023-04-29 11:26:43,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +58: [2023-04-29 11:26:43,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +49: [2023-04-29 11:26:43,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +61: [2023-04-29 11:26:43,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +61: [2023-04-29 11:26:43,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +48: [2023-04-29 11:26:43,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +57: [2023-04-29 11:26:43,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +34: [2023-04-29 11:26:43,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +34: [2023-04-29 11:26:43,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +34: [2023-04-29 11:26:43,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +44: [2023-04-29 11:26:43,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +48: [2023-04-29 11:26:43,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +57: [2023-04-29 11:26:43,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +44: [2023-04-29 11:26:43,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +46: [2023-04-29 11:26:43,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +23: [2023-04-29 11:26:43,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +34: [2023-04-29 11:26:43,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +23: [2023-04-29 11:26:43,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +63: [2023-04-29 11:26:43,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +63: [2023-04-29 11:26:43,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +63: [2023-04-29 11:26:43,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +35: [2023-04-29 11:26:43,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 11:26:43,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +35: [2023-04-29 11:26:43,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +23: [2023-04-29 11:26:43,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +23: [2023-04-29 11:26:43,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +57: [2023-04-29 11:26:43,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +33: [2023-04-29 11:26:43,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +33: [2023-04-29 11:26:43,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +32: [2023-04-29 11:26:43,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +44: [2023-04-29 11:26:43,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +32: [2023-04-29 11:26:43,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +33: [2023-04-29 11:26:43,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +32: [2023-04-29 11:26:43,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +34: [2023-04-29 11:26:43,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +34: [2023-04-29 11:26:43,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +35: [2023-04-29 11:26:43,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +33: [2023-04-29 11:26:43,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +34: [2023-04-29 11:26:43,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +44: [2023-04-29 11:26:43,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +34: [2023-04-29 11:26:43,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +48: [2023-04-29 11:26:43,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +48: [2023-04-29 11:26:43,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +57: [2023-04-29 11:26:43,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +59: [2023-04-29 11:26:43,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +59: [2023-04-29 11:26:43,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +59: [2023-04-29 11:26:43,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +59: [2023-04-29 11:26:43,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +54: [2023-04-29 11:26:43,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +35: [2023-04-29 11:26:43,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +35: [2023-04-29 11:26:43,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +35: [2023-04-29 11:26:43,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +35: [2023-04-29 11:26:43,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +48: [2023-04-29 11:26:43,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +48: [2023-04-29 11:26:43,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +19: [2023-04-29 11:26:43,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +53: [2023-04-29 11:26:43,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +53: [2023-04-29 11:26:43,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +53: [2023-04-29 11:26:43,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +46: [2023-04-29 11:26:43,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +53: [2023-04-29 11:26:43,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +48: [2023-04-29 11:26:43,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +48: [2023-04-29 11:26:43,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +19: [2023-04-29 11:26:43,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +35: [2023-04-29 11:26:43,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +58: [2023-04-29 11:26:43,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +58: [2023-04-29 11:26:43,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +58: [2023-04-29 11:26:43,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +58: [2023-04-29 11:26:43,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +33: [2023-04-29 11:26:43,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +33: [2023-04-29 11:26:43,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +33: [2023-04-29 11:26:43,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +49: [2023-04-29 11:26:43,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +42: [2023-04-29 11:26:43,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +42: [2023-04-29 11:26:43,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +19: [2023-04-29 11:26:43,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +54: [2023-04-29 11:26:43,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +40: [2023-04-29 11:26:43,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +33: [2023-04-29 11:26:43,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +54: [2023-04-29 11:26:43,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +19: [2023-04-29 11:26:43,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +46: [2023-04-29 11:26:43,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +46: [2023-04-29 11:26:43,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +49: [2023-04-29 11:26:43,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +25: [2023-04-29 11:26:43,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +25: [2023-04-29 11:26:43,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +25: [2023-04-29 11:26:43,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +25: [2023-04-29 11:26:43,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +54: [2023-04-29 11:26:43,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +40: [2023-04-29 11:26:43,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +63: [2023-04-29 11:26:43,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +62: [2023-04-29 11:26:43,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +62: [2023-04-29 11:26:43,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +62: [2023-04-29 11:26:43,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +62: [2023-04-29 11:26:43,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +38: [2023-04-29 11:26:43,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +38: [2023-04-29 11:26:43,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +38: [2023-04-29 11:26:43,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +38: [2023-04-29 11:26:43,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +40: [2023-04-29 11:26:43,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +40: [2023-04-29 11:26:43,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +57: [2023-04-29 11:26:43,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +51: [2023-04-29 11:26:43,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +57: [2023-04-29 11:26:43,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +54: [2023-04-29 11:26:43,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +54: [2023-04-29 11:26:43,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +51: [2023-04-29 11:26:43,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +47: [2023-04-29 11:26:43,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +47: [2023-04-29 11:26:43,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +47: [2023-04-29 11:26:43,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +59: [2023-04-29 11:26:43,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +59: [2023-04-29 11:26:43,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +59: [2023-04-29 11:26:43,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 11:26:43,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +54: [2023-04-29 11:26:43,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +54: [2023-04-29 11:26:43,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +34: [2023-04-29 11:26:43,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +34: [2023-04-29 11:26:43,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +59: [2023-04-29 11:26:43,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +12: [2023-04-29 11:26:43,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +12: [2023-04-29 11:26:43,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +12: [2023-04-29 11:26:43,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +12: [2023-04-29 11:26:43,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +53: [2023-04-29 11:26:43,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +47: [2023-04-29 11:26:43,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +63: [2023-04-29 11:26:43,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 11:26:43,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +53: [2023-04-29 11:26:43,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +63: [2023-04-29 11:26:43,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +48: [2023-04-29 11:26:43,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 11:26:43,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +18: [2023-04-29 11:26:43,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +48: [2023-04-29 11:26:43,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 11:26:43,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +57: [2023-04-29 11:26:43,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +58: [2023-04-29 11:26:43,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +53: [2023-04-29 11:26:43,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +53: [2023-04-29 11:26:43,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +18: [2023-04-29 11:26:43,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +18: [2023-04-29 11:26:43,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +63: [2023-04-29 11:26:43,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +34: [2023-04-29 11:26:43,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +34: [2023-04-29 11:26:43,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +48: [2023-04-29 11:26:43,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +48: [2023-04-29 11:26:43,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +57: [2023-04-29 11:26:43,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +35: [2023-04-29 11:26:43,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +47: [2023-04-29 11:26:43,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +25: [2023-04-29 11:26:43,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +18: [2023-04-29 11:26:43,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +51: [2023-04-29 11:26:43,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +51: [2023-04-29 11:26:43,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +51: [2023-04-29 11:26:43,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +18: [2023-04-29 11:26:43,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +25: [2023-04-29 11:26:43,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +35: [2023-04-29 11:26:43,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +35: [2023-04-29 11:26:43,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +35: [2023-04-29 11:26:43,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +35: [2023-04-29 11:26:43,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +35: [2023-04-29 11:26:43,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +58: [2023-04-29 11:26:43,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +58: [2023-04-29 11:26:43,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +58: [2023-04-29 11:26:43,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +25: [2023-04-29 11:26:43,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +25: [2023-04-29 11:26:43,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +18: [2023-04-29 11:26:43,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +18: [2023-04-29 11:26:43,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +38: [2023-04-29 11:26:43,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +18: [2023-04-29 11:26:43,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +38: [2023-04-29 11:26:43,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +62: [2023-04-29 11:26:43,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +35: [2023-04-29 11:26:43,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +35: [2023-04-29 11:26:43,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +62: [2023-04-29 11:26:43,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +51: [2023-04-29 11:26:43,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +51: [2023-04-29 11:26:43,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +38: [2023-04-29 11:26:43,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +62: [2023-04-29 11:26:43,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +62: [2023-04-29 11:26:43,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +38: [2023-04-29 11:26:43,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +61: [2023-04-29 11:26:43,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +55: [2023-04-29 11:26:43,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +55: [2023-04-29 11:26:43,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +55: [2023-04-29 11:26:43,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +55: [2023-04-29 11:26:43,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +55: [2023-04-29 11:26:43,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +12: [2023-04-29 11:26:43,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +61: [2023-04-29 11:26:43,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +55: [2023-04-29 11:26:43,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +55: [2023-04-29 11:26:43,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +55: [2023-04-29 11:26:43,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +12: [2023-04-29 11:26:43,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +12: [2023-04-29 11:26:43,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +12: [2023-04-29 11:26:43,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +61: [2023-04-29 11:26:43,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +61: [2023-04-29 11:26:43,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +61: [2023-04-29 11:26:43,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +23: [2023-04-29 11:26:43,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +23: [2023-04-29 11:26:43,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +61: [2023-04-29 11:26:43,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +61: [2023-04-29 11:26:43,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +19: [2023-04-29 11:26:43,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +61: [2023-04-29 11:26:43,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +10: [2023-04-29 11:26:43,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +10: [2023-04-29 11:26:43,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +23: [2023-04-29 11:26:43,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +23: [2023-04-29 11:26:43,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +23: [2023-04-29 11:26:43,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +23: [2023-04-29 11:26:43,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +33: [2023-04-29 11:26:43,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +10: [2023-04-29 11:26:43,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +10: [2023-04-29 11:26:43,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +19: [2023-04-29 11:26:43,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +19: [2023-04-29 11:26:43,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +34: [2023-04-29 11:26:43,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +23: [2023-04-29 11:26:43,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +19: [2023-04-29 11:26:43,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +23: [2023-04-29 11:26:43,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +19: [2023-04-29 11:26:43,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +34: [2023-04-29 11:26:43,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +33: [2023-04-29 11:26:43,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +19: [2023-04-29 11:26:43,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +33: [2023-04-29 11:26:43,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +33: [2023-04-29 11:26:43,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +59: [2023-04-29 11:26:43,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +19: [2023-04-29 11:26:43,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +37: [2023-04-29 11:26:43,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +37: [2023-04-29 11:26:43,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +37: [2023-04-29 11:26:43,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +37: [2023-04-29 11:26:43,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +59: [2023-04-29 11:26:43,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +48: [2023-04-29 11:26:43,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +19: [2023-04-29 11:26:43,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +37: [2023-04-29 11:26:43,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +57: [2023-04-29 11:26:43,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +57: [2023-04-29 11:26:43,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +57: [2023-04-29 11:26:43,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +57: [2023-04-29 11:26:43,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +37: [2023-04-29 11:26:43,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +37: [2023-04-29 11:26:43,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +37: [2023-04-29 11:26:43,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +48: [2023-04-29 11:26:43,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +59: [2023-04-29 11:26:43,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 2: [2023-04-29 11:26:43,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 2: [2023-04-29 11:26:43,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 2: [2023-04-29 11:26:43,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +59: [2023-04-29 11:26:43,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +34: [2023-04-29 11:26:43,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 11:26:43,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +22: [2023-04-29 11:26:43,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +22: [2023-04-29 11:26:43,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +22: [2023-04-29 11:26:43,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +22: [2023-04-29 11:26:43,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +38: [2023-04-29 11:26:43,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +38: [2023-04-29 11:26:43,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +38: [2023-04-29 11:26:43,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +38: [2023-04-29 11:26:43,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +33: [2023-04-29 11:26:43,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 11:26:43,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +26: [2023-04-29 11:26:43,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +26: [2023-04-29 11:26:43,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +26: [2023-04-29 11:26:43,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +26: [2023-04-29 11:26:43,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +34: [2023-04-29 11:26:43,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +47: [2023-04-29 11:26:43,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 11:26:43,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +58: [2023-04-29 11:26:43,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +34: [2023-04-29 11:26:43,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +25: [2023-04-29 11:26:43,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +59: [2023-04-29 11:26:43,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +59: [2023-04-29 11:26:43,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +38: [2023-04-29 11:26:43,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +53: [2023-04-29 11:26:43,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +38: [2023-04-29 11:26:43,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +38: [2023-04-29 11:26:43,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +10: [2023-04-29 11:26:43,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +38: [2023-04-29 11:26:43,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +10: [2023-04-29 11:26:43,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +10: [2023-04-29 11:26:43,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +58: [2023-04-29 11:26:43,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +53: [2023-04-29 11:26:43,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +48: [2023-04-29 11:26:43,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +25: [2023-04-29 11:26:43,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +34: [2023-04-29 11:26:43,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +34: [2023-04-29 11:26:43,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +25: [2023-04-29 11:26:43,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +58: [2023-04-29 11:26:43,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +58: [2023-04-29 11:26:43,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +10: [2023-04-29 11:26:43,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +34: [2023-04-29 11:26:43,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 11:26:43,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +38: [2023-04-29 11:26:43,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +53: [2023-04-29 11:26:43,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 11:26:43,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +47: [2023-04-29 11:26:43,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +47: [2023-04-29 11:26:43,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +42: [2023-04-29 11:26:43,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +42: [2023-04-29 11:26:43,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +42: [2023-04-29 11:26:43,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +42: [2023-04-29 11:26:43,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +48: [2023-04-29 11:26:43,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +35: [2023-04-29 11:26:43,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +38: [2023-04-29 11:26:43,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +62: [2023-04-29 11:26:43,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +46: [2023-04-29 11:26:43,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +46: [2023-04-29 11:26:43,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +25: [2023-04-29 11:26:43,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +48: [2023-04-29 11:26:43,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +33: [2023-04-29 11:26:43,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +25: [2023-04-29 11:26:43,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +48: [2023-04-29 11:26:43,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +58: [2023-04-29 11:26:43,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +33: [2023-04-29 11:26:43,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +34: [2023-04-29 11:26:43,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +47: [2023-04-29 11:26:43,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +47: [2023-04-29 11:26:43,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +58: [2023-04-29 11:26:43,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +58: [2023-04-29 11:26:43,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +62: [2023-04-29 11:26:43,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 11:26:43,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +53: [2023-04-29 11:26:43,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +38: [2023-04-29 11:26:43,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +33: [2023-04-29 11:26:43,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +46: [2023-04-29 11:26:43,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +25: [2023-04-29 11:26:43,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +46: [2023-04-29 11:26:43,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +50: [2023-04-29 11:26:43,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +50: [2023-04-29 11:26:43,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +50: [2023-04-29 11:26:43,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +50: [2023-04-29 11:26:43,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +48: [2023-04-29 11:26:43,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +35: [2023-04-29 11:26:43,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +35: [2023-04-29 11:26:43,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +35: [2023-04-29 11:26:43,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +35: [2023-04-29 11:26:43,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +25: [2023-04-29 11:26:43,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +38: [2023-04-29 11:26:43,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +58: [2023-04-29 11:26:43,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +57: [2023-04-29 11:26:43,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +62: [2023-04-29 11:26:43,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +62: [2023-04-29 11:26:43,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +62: [2023-04-29 11:26:43,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +48: [2023-04-29 11:26:43,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +62: [2023-04-29 11:26:43,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +34: [2023-04-29 11:26:43,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +25: [2023-04-29 11:26:43,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +32: [2023-04-29 11:26:43,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +32: [2023-04-29 11:26:43,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +47: [2023-04-29 11:26:43,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +12: [2023-04-29 11:26:43,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +57: [2023-04-29 11:26:43,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +57: [2023-04-29 11:26:43,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 11:26:43,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +32: [2023-04-29 11:26:43,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +47: [2023-04-29 11:26:43,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +32: [2023-04-29 11:26:43,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +62: [2023-04-29 11:26:43,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +62: [2023-04-29 11:26:43,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +35: [2023-04-29 11:26:43,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +35: [2023-04-29 11:26:43,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +35: [2023-04-29 11:26:43,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +22: [2023-04-29 11:26:43,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +22: [2023-04-29 11:26:43,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +38: [2023-04-29 11:26:43,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +47: [2023-04-29 11:26:43,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +26: [2023-04-29 11:26:43,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 11:26:43,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +34: [2023-04-29 11:26:43,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +12: [2023-04-29 11:26:43,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +57: [2023-04-29 11:26:43,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +40: [2023-04-29 11:26:43,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +40: [2023-04-29 11:26:43,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +40: [2023-04-29 11:26:43,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +40: [2023-04-29 11:26:43,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +22: [2023-04-29 11:26:43,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +38: [2023-04-29 11:26:43,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +22: [2023-04-29 11:26:43,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +26: [2023-04-29 11:26:43,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +38: [2023-04-29 11:26:43,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... + 2: [2023-04-29 11:26:43,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 2: [2023-04-29 11:26:43,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 2: [2023-04-29 11:26:43,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 2: [2023-04-29 11:26:43,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +34: [2023-04-29 11:26:43,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +55: [2023-04-29 11:26:43,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +34: [2023-04-29 11:26:43,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +26: [2023-04-29 11:26:43,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +12: [2023-04-29 11:26:43,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +38: [2023-04-29 11:26:43,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +12: [2023-04-29 11:26:43,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +12: [2023-04-29 11:26:43,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +39: [2023-04-29 11:26:43,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +39: [2023-04-29 11:26:43,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +34: [2023-04-29 11:26:43,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +39: [2023-04-29 11:26:43,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +39: [2023-04-29 11:26:43,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +55: [2023-04-29 11:26:43,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +55: [2023-04-29 11:26:43,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +26: [2023-04-29 11:26:43,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 5: [2023-04-29 11:26:43,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 5: [2023-04-29 11:26:43,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 5: [2023-04-29 11:26:43,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 5: [2023-04-29 11:26:43,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +56: [2023-04-29 11:26:43,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +56: [2023-04-29 11:26:43,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +37: [2023-04-29 11:26:43,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +37: [2023-04-29 11:26:43,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +42: [2023-04-29 11:26:43,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +42: [2023-04-29 11:26:43,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +42: [2023-04-29 11:26:43,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +42: [2023-04-29 11:26:43,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 11:26:43,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +12: [2023-04-29 11:26:43,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +37: [2023-04-29 11:26:43,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +12: [2023-04-29 11:26:43,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +12: [2023-04-29 11:26:43,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +37: [2023-04-29 11:26:43,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +50: [2023-04-29 11:26:43,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +56: [2023-04-29 11:26:43,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +46: [2023-04-29 11:26:43,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +56: [2023-04-29 11:26:43,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +46: [2023-04-29 11:26:43,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +46: [2023-04-29 11:26:43,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 11:26:43,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 11:26:43,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 9: [2023-04-29 11:26:43,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +46: [2023-04-29 11:26:43,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 11:26:43,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +50: [2023-04-29 11:26:43,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +50: [2023-04-29 11:26:43,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 11:26:43,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 9: [2023-04-29 11:26:43,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +34: [2023-04-29 11:26:43,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +50: [2023-04-29 11:26:43,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +55: [2023-04-29 11:26:43,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +32: [2023-04-29 11:26:43,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +33: [2023-04-29 11:26:43,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +33: [2023-04-29 11:26:43,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +33: [2023-04-29 11:26:43,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +32: [2023-04-29 11:26:43,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +33: [2023-04-29 11:26:43,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +47: [2023-04-29 11:26:43,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +37: [2023-04-29 11:26:43,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +34: [2023-04-29 11:26:43,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +40: [2023-04-29 11:26:43,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +47: [2023-04-29 11:26:43,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +32: [2023-04-29 11:26:43,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +40: [2023-04-29 11:26:43,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +40: [2023-04-29 11:26:43,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +40: [2023-04-29 11:26:43,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +32: [2023-04-29 11:26:43,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +39: [2023-04-29 11:26:43,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +41: [2023-04-29 11:26:43,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +41: [2023-04-29 11:26:43,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +39: [2023-04-29 11:26:43,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +41: [2023-04-29 11:26:43,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +41: [2023-04-29 11:26:43,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +39: [2023-04-29 11:26:43,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +39: [2023-04-29 11:26:43,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +55: [2023-04-29 11:26:43,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +10: [2023-04-29 11:26:43,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +41: [2023-04-29 11:26:43,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 11:26:43,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 5: [2023-04-29 11:26:43,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 11:26:43,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +55: [2023-04-29 11:26:43,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +41: [2023-04-29 11:26:43,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 11:26:43,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +38: [2023-04-29 11:26:43,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +56: [2023-04-29 11:26:43,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +10: [2023-04-29 11:26:43,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +37: [2023-04-29 11:26:43,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 5: [2023-04-29 11:26:43,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +50: [2023-04-29 11:26:43,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +50: [2023-04-29 11:26:43,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +56: [2023-04-29 11:26:43,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +56: [2023-04-29 11:26:43,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +50: [2023-04-29 11:26:43,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +50: [2023-04-29 11:26:43,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +37: [2023-04-29 11:26:43,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 5: [2023-04-29 11:26:43,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 5: [2023-04-29 11:26:43,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +60: [2023-04-29 11:26:43,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +60: [2023-04-29 11:26:43,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +60: [2023-04-29 11:26:43,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +60: [2023-04-29 11:26:43,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +56: [2023-04-29 11:26:43,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +10: [2023-04-29 11:26:43,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +10: [2023-04-29 11:26:43,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 9: [2023-04-29 11:26:43,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +37: [2023-04-29 11:26:43,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +10: [2023-04-29 11:26:43,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +37: [2023-04-29 11:26:43,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +37: [2023-04-29 11:26:43,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +57: [2023-04-29 11:26:43,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +38: [2023-04-29 11:26:43,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +38: [2023-04-29 11:26:43,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +50: [2023-04-29 11:26:43,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +38: [2023-04-29 11:26:43,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +50: [2023-04-29 11:26:43,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +50: [2023-04-29 11:26:43,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +50: [2023-04-29 11:26:43,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +10: [2023-04-29 11:26:43,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +33: [2023-04-29 11:26:43,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +10: [2023-04-29 11:26:43,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +52: [2023-04-29 11:26:43,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +52: [2023-04-29 11:26:43,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +10: [2023-04-29 11:26:43,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +57: [2023-04-29 11:26:43,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +37: [2023-04-29 11:26:43,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +33: [2023-04-29 11:26:43,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +33: [2023-04-29 11:26:43,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +33: [2023-04-29 11:26:43,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +52: [2023-04-29 11:26:43,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +52: [2023-04-29 11:26:43,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +37: [2023-04-29 11:26:43,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +37: [2023-04-29 11:26:43,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +57: [2023-04-29 11:26:43,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 1: [2023-04-29 11:26:43,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 1: [2023-04-29 11:26:43,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +26: [2023-04-29 11:26:43,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 1: [2023-04-29 11:26:43,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 1: [2023-04-29 11:26:43,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +46: [2023-04-29 11:26:43,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +38: [2023-04-29 11:26:43,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +22: [2023-04-29 11:26:43,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +22: [2023-04-29 11:26:43,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +57: [2023-04-29 11:26:43,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +57: [2023-04-29 11:26:43,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +26: [2023-04-29 11:26:43,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +46: [2023-04-29 11:26:43,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +60: [2023-04-29 11:26:43,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +57: [2023-04-29 11:26:43,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +42: [2023-04-29 11:26:43,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 11:26:43,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +63: [2023-04-29 11:26:43,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +63: [2023-04-29 11:26:43,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +63: [2023-04-29 11:26:43,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +47: [2023-04-29 11:26:43,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +50: [2023-04-29 11:26:43,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +22: [2023-04-29 11:26:43,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +22: [2023-04-29 11:26:43,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +22: [2023-04-29 11:26:43,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +57: [2023-04-29 11:26:43,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +60: [2023-04-29 11:26:43,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +60: [2023-04-29 11:26:43,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +60: [2023-04-29 11:26:43,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +37: [2023-04-29 11:26:43,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +47: [2023-04-29 11:26:43,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +26: [2023-04-29 11:26:43,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 6: [2023-04-29 11:26:43,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 6: [2023-04-29 11:26:43,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +47: [2023-04-29 11:26:43,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... + 6: [2023-04-29 11:26:43,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +21: [2023-04-29 11:26:43,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +21: [2023-04-29 11:26:43,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +22: [2023-04-29 11:26:43,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +57: [2023-04-29 11:26:43,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +42: [2023-04-29 11:26:43,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +24: [2023-04-29 11:26:43,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +50: [2023-04-29 11:26:43,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +26: [2023-04-29 11:26:43,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +24: [2023-04-29 11:26:43,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +24: [2023-04-29 11:26:43,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +24: [2023-04-29 11:26:43,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +40: [2023-04-29 11:26:43,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +42: [2023-04-29 11:26:43,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +50: [2023-04-29 11:26:43,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 7: [2023-04-29 11:26:43,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 7: [2023-04-29 11:26:43,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 7: [2023-04-29 11:26:43,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 2: [2023-04-29 11:26:43,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +47: [2023-04-29 11:26:43,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +22: [2023-04-29 11:26:43,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +21: [2023-04-29 11:26:43,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +38: [2023-04-29 11:26:43,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 2: [2023-04-29 11:26:43,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +21: [2023-04-29 11:26:43,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +38: [2023-04-29 11:26:43,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 11:26:43,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +52: [2023-04-29 11:26:43,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +26: [2023-04-29 11:26:43,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +40: [2023-04-29 11:26:43,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +52: [2023-04-29 11:26:43,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +52: [2023-04-29 11:26:43,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +27: [2023-04-29 11:26:43,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +27: [2023-04-29 11:26:43,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +27: [2023-04-29 11:26:43,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +52: [2023-04-29 11:26:43,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +27: [2023-04-29 11:26:43,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +26: [2023-04-29 11:26:43,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +55: [2023-04-29 11:26:43,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +55: [2023-04-29 11:26:43,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +50: [2023-04-29 11:26:43,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +42: [2023-04-29 11:26:43,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +22: [2023-04-29 11:26:43,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +26: [2023-04-29 11:26:43,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +38: [2023-04-29 11:26:43,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +46: [2023-04-29 11:26:43,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +46: [2023-04-29 11:26:43,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +46: [2023-04-29 11:26:43,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +52: [2023-04-29 11:26:43,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +52: [2023-04-29 11:26:43,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +42: [2023-04-29 11:26:43,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +52: [2023-04-29 11:26:43,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +55: [2023-04-29 11:26:43,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. + 2: [2023-04-29 11:26:43,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... + 2: [2023-04-29 11:26:43,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... + 2: [2023-04-29 11:26:43,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +50: [2023-04-29 11:26:43,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +55: [2023-04-29 11:26:43,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +39: [2023-04-29 11:26:43,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +52: [2023-04-29 11:26:43,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +26: [2023-04-29 11:26:43,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +42: [2023-04-29 11:26:43,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +52: [2023-04-29 11:26:43,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +52: [2023-04-29 11:26:43,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +46: [2023-04-29 11:26:43,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +52: [2023-04-29 11:26:43,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +42: [2023-04-29 11:26:43,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +39: [2023-04-29 11:26:43,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +32: [2023-04-29 11:26:43,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +47: [2023-04-29 11:26:43,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +52: [2023-04-29 11:26:43,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 1: [2023-04-29 11:26:43,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 1: [2023-04-29 11:26:43,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +50: [2023-04-29 11:26:43,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +50: [2023-04-29 11:26:43,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +46: [2023-04-29 11:26:43,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +14: [2023-04-29 11:26:43,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +14: [2023-04-29 11:26:43,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +46: [2023-04-29 11:26:43,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +14: [2023-04-29 11:26:43,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +14: [2023-04-29 11:26:43,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +39: [2023-04-29 11:26:43,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +47: [2023-04-29 11:26:43,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 1: [2023-04-29 11:26:43,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 1: [2023-04-29 11:26:43,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +37: [2023-04-29 11:26:43,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +32: [2023-04-29 11:26:43,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +37: [2023-04-29 11:26:43,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +39: [2023-04-29 11:26:43,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +47: [2023-04-29 11:26:43,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +50: [2023-04-29 11:26:43,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +39: [2023-04-29 11:26:43,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +40: [2023-04-29 11:26:43,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +40: [2023-04-29 11:26:43,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +40: [2023-04-29 11:26:43,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +47: [2023-04-29 11:26:43,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... + 5: [2023-04-29 11:26:43,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +63: [2023-04-29 11:26:43,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +39: [2023-04-29 11:26:43,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +24: [2023-04-29 11:26:43,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +41: [2023-04-29 11:26:43,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +41: [2023-04-29 11:26:43,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +41: [2023-04-29 11:26:43,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. + 6: [2023-04-29 11:26:43,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 6: [2023-04-29 11:26:43,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 6: [2023-04-29 11:26:43,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +41: [2023-04-29 11:26:43,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. + 7: [2023-04-29 11:26:43,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +41: [2023-04-29 11:26:43,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +32: [2023-04-29 11:26:43,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +32: [2023-04-29 11:26:43,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 5: [2023-04-29 11:26:43,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 5: [2023-04-29 11:26:43,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +63: [2023-04-29 11:26:43,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +45: [2023-04-29 11:26:43,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +45: [2023-04-29 11:26:43,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +45: [2023-04-29 11:26:43,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +21: [2023-04-29 11:26:43,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +21: [2023-04-29 11:26:43,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +56: [2023-04-29 11:26:43,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 11:26:43,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +40: [2023-04-29 11:26:43,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +40: [2023-04-29 11:26:43,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +40: [2023-04-29 11:26:43,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +24: [2023-04-29 11:26:43,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 7: [2023-04-29 11:26:43,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +45: [2023-04-29 11:26:43,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +41: [2023-04-29 11:26:43,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +21: [2023-04-29 11:26:43,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +37: [2023-04-29 11:26:43,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +41: [2023-04-29 11:26:43,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +39: [2023-04-29 11:26:43,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 5: [2023-04-29 11:26:43,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +41: [2023-04-29 11:26:43,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +24: [2023-04-29 11:26:43,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +24: [2023-04-29 11:26:43,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +45: [2023-04-29 11:26:43,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +45: [2023-04-29 11:26:43,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +32: [2023-04-29 11:26:43,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +32: [2023-04-29 11:26:43,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +56: [2023-04-29 11:26:43,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +63: [2023-04-29 11:26:43,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +45: [2023-04-29 11:26:43,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +27: [2023-04-29 11:26:43,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +19: [2023-04-29 11:26:43,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +19: [2023-04-29 11:26:43,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +27: [2023-04-29 11:26:43,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +19: [2023-04-29 11:26:43,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +54: [2023-04-29 11:26:43,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +54: [2023-04-29 11:26:43,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +54: [2023-04-29 11:26:43,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +19: [2023-04-29 11:26:43,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 7: [2023-04-29 11:26:43,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +54: [2023-04-29 11:26:43,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +56: [2023-04-29 11:26:43,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +32: [2023-04-29 11:26:43,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +37: [2023-04-29 11:26:43,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +39: [2023-04-29 11:26:43,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +55: [2023-04-29 11:26:43,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +21: [2023-04-29 11:26:43,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 11:26:43,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +55: [2023-04-29 11:26:43,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +27: [2023-04-29 11:26:43,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +45: [2023-04-29 11:26:43,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +56: [2023-04-29 11:26:43,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +56: [2023-04-29 11:26:43,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +27: [2023-04-29 11:26:43,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +19: [2023-04-29 11:26:43,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +36: [2023-04-29 11:26:43,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +36: [2023-04-29 11:26:43,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +19: [2023-04-29 11:26:43,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +50: [2023-04-29 11:26:43,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 5: [2023-04-29 11:26:43,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 5: [2023-04-29 11:26:43,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 3: [2023-04-29 11:26:43,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 3: [2023-04-29 11:26:43,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +19: [2023-04-29 11:26:43,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +32: [2023-04-29 11:26:43,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +36: [2023-04-29 11:26:43,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +36: [2023-04-29 11:26:43,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +19: [2023-04-29 11:26:43,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +56: [2023-04-29 11:26:43,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +14: [2023-04-29 11:26:43,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +14: [2023-04-29 11:26:43,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +14: [2023-04-29 11:26:43,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +55: [2023-04-29 11:26:43,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... + 4: [2023-04-29 11:26:43,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 4: [2023-04-29 11:26:43,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 4: [2023-04-29 11:26:43,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 3: [2023-04-29 11:26:43,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 4: [2023-04-29 11:26:43,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 3: [2023-04-29 11:26:43,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +33: [2023-04-29 11:26:43,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +14: [2023-04-29 11:26:43,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +56: [2023-04-29 11:26:43,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +56: [2023-04-29 11:26:43,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +50: [2023-04-29 11:26:43,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 5: [2023-04-29 11:26:43,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... + 5: [2023-04-29 11:26:43,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +60: [2023-04-29 11:26:43,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +33: [2023-04-29 11:26:43,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +33: [2023-04-29 11:26:43,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +33: [2023-04-29 11:26:43,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +33: [2023-04-29 11:26:43,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +50: [2023-04-29 11:26:43,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +50: [2023-04-29 11:26:43,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +60: [2023-04-29 11:26:43,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +30: [2023-04-29 11:26:43,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +30: [2023-04-29 11:26:43,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +33: [2023-04-29 11:26:43,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +33: [2023-04-29 11:26:43,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +30: [2023-04-29 11:26:43,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +33: [2023-04-29 11:26:43,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +37: [2023-04-29 11:26:43,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +41: [2023-04-29 11:26:43,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +60: [2023-04-29 11:26:43,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +37: [2023-04-29 11:26:43,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +30: [2023-04-29 11:26:43,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +41: [2023-04-29 11:26:43,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 11:26:43,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 11:26:43,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +41: [2023-04-29 11:26:43,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +37: [2023-04-29 11:26:43,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +60: [2023-04-29 11:26:43,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +41: [2023-04-29 11:26:43,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 11:26:43,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +30: [2023-04-29 11:26:43,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +30: [2023-04-29 11:26:43,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +60: [2023-04-29 11:26:43,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +54: [2023-04-29 11:26:43,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +54: [2023-04-29 11:26:43,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 11:26:43,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +54: [2023-04-29 11:26:43,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +30: [2023-04-29 11:26:43,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +60: [2023-04-29 11:26:43,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +30: [2023-04-29 11:26:43,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +54: [2023-04-29 11:26:43,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +36: [2023-04-29 11:26:43,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +36: [2023-04-29 11:26:43,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +36: [2023-04-29 11:26:43,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +37: [2023-04-29 11:26:43,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +43: [2023-04-29 11:26:43,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +36: [2023-04-29 11:26:43,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +43: [2023-04-29 11:26:43,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +43: [2023-04-29 11:26:43,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. + 3: [2023-04-29 11:26:43,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 3: [2023-04-29 11:26:43,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 3: [2023-04-29 11:26:43,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +43: [2023-04-29 11:26:43,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +60: [2023-04-29 11:26:43,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... + 3: [2023-04-29 11:26:43,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +37: [2023-04-29 11:26:43,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +60: [2023-04-29 11:26:43,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... + 4: [2023-04-29 11:26:43,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 4: [2023-04-29 11:26:43,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +37: [2023-04-29 11:26:43,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... + 4: [2023-04-29 11:26:43,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... + 4: [2023-04-29 11:26:43,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +17: [2023-04-29 11:26:43,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +17: [2023-04-29 11:26:43,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +50: [2023-04-29 11:26:43,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +17: [2023-04-29 11:26:43,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +17: [2023-04-29 11:26:43,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 1: [2023-04-29 11:26:43,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 1: [2023-04-29 11:26:43,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +52: [2023-04-29 11:26:43,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +52: [2023-04-29 11:26:43,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +52: [2023-04-29 11:26:43,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +52: [2023-04-29 11:26:43,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +52: [2023-04-29 11:26:43,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 1: [2023-04-29 11:26:43,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +50: [2023-04-29 11:26:43,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 1: [2023-04-29 11:26:43,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... + 1: [2023-04-29 11:26:43,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +52: [2023-04-29 11:26:43,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +52: [2023-04-29 11:26:43,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 1: [2023-04-29 11:26:43,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +52: [2023-04-29 11:26:43,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... + 1: [2023-04-29 11:26:43,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +52: [2023-04-29 11:26:43,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +50: [2023-04-29 11:26:43,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +50: [2023-04-29 11:26:43,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 1: [2023-04-29 11:26:43,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +52: [2023-04-29 11:26:43,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... + 6: [2023-04-29 11:26:43,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +52: [2023-04-29 11:26:43,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +51: [2023-04-29 11:26:43,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +51: [2023-04-29 11:26:43,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +51: [2023-04-29 11:26:43,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +51: [2023-04-29 11:26:43,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. + 6: [2023-04-29 11:26:43,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +52: [2023-04-29 11:26:43,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +21: [2023-04-29 11:26:43,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +19: [2023-04-29 11:26:43,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +28: [2023-04-29 11:26:43,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +28: [2023-04-29 11:26:43,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +63: [2023-04-29 11:26:43,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +28: [2023-04-29 11:26:43,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +28: [2023-04-29 11:26:43,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +43: [2023-04-29 11:26:43,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +63: [2023-04-29 11:26:43,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +43: [2023-04-29 11:26:43,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +45: [2023-04-29 11:26:43,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +21: [2023-04-29 11:26:43,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +43: [2023-04-29 11:26:43,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +27: [2023-04-29 11:26:43,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +21: [2023-04-29 11:26:43,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +21: [2023-04-29 11:26:43,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +45: [2023-04-29 11:26:43,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 11:26:43,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +63: [2023-04-29 11:26:43,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +55: [2023-04-29 11:26:43,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +17: [2023-04-29 11:26:43,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +17: [2023-04-29 11:26:43,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +63: [2023-04-29 11:26:43,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +63: [2023-04-29 11:26:43,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +63: [2023-04-29 11:26:43,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +27: [2023-04-29 11:26:43,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +27: [2023-04-29 11:26:43,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +14: [2023-04-29 11:26:43,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +14: [2023-04-29 11:26:43,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 11:26:43,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +17: [2023-04-29 11:26:43,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +45: [2023-04-29 11:26:43,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +19: [2023-04-29 11:26:43,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +21: [2023-04-29 11:26:43,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +55: [2023-04-29 11:26:43,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +11: [2023-04-29 11:26:43,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +11: [2023-04-29 11:26:43,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +27: [2023-04-29 11:26:43,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +55: [2023-04-29 11:26:43,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +11: [2023-04-29 11:26:43,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +21: [2023-04-29 11:26:43,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +11: [2023-04-29 11:26:43,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +21: [2023-04-29 11:26:43,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +14: [2023-04-29 11:26:43,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +14: [2023-04-29 11:26:43,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +14: [2023-04-29 11:26:43,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +27: [2023-04-29 11:26:43,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +27: [2023-04-29 11:26:43,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +27: [2023-04-29 11:26:43,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +63: [2023-04-29 11:26:43,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +63: [2023-04-29 11:26:43,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +19: [2023-04-29 11:26:43,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +14: [2023-04-29 11:26:43,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +55: [2023-04-29 11:26:43,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +14: [2023-04-29 11:26:43,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +52: [2023-04-29 11:26:43,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +52: [2023-04-29 11:26:43,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +21: [2023-04-29 11:26:43,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +52: [2023-04-29 11:26:43,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +27: [2023-04-29 11:26:43,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +55: [2023-04-29 11:26:43,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +14: [2023-04-29 11:26:43,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +29: [2023-04-29 11:26:43,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +29: [2023-04-29 11:26:43,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +29: [2023-04-29 11:26:43,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +29: [2023-04-29 11:26:43,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +51: [2023-04-29 11:26:43,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +51: [2023-04-29 11:26:43,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +55: [2023-04-29 11:26:43,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 11:26:43,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +36: [2023-04-29 11:26:43,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +51: [2023-04-29 11:26:43,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +51: [2023-04-29 11:26:43,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +19: [2023-04-29 11:26:43,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +19: [2023-04-29 11:26:43,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +59: [2023-04-29 11:26:43,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +59: [2023-04-29 11:26:43,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +28: [2023-04-29 11:26:43,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +52: [2023-04-29 11:26:43,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +55: [2023-04-29 11:26:43,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +36: [2023-04-29 11:26:43,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +28: [2023-04-29 11:26:43,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +28: [2023-04-29 11:26:43,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +41: [2023-04-29 11:26:43,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +28: [2023-04-29 11:26:43,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +30: [2023-04-29 11:26:43,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +30: [2023-04-29 11:26:43,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +59: [2023-04-29 11:26:43,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +59: [2023-04-29 11:26:43,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +55: [2023-04-29 11:26:43,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +59: [2023-04-29 11:26:43,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +59: [2023-04-29 11:26:43,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +36: [2023-04-29 11:26:43,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 11:26:43,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 3: [2023-04-29 11:26:43,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +59: [2023-04-29 11:26:43,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +45: [2023-04-29 11:26:43,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +45: [2023-04-29 11:26:43,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +59: [2023-04-29 11:26:43,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +36: [2023-04-29 11:26:43,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 11:26:43,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +54: [2023-04-29 11:26:43,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +54: [2023-04-29 11:26:43,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +30: [2023-04-29 11:26:43,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +30: [2023-04-29 11:26:43,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +45: [2023-04-29 11:26:43,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +41: [2023-04-29 11:26:43,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +41: [2023-04-29 11:26:43,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +59: [2023-04-29 11:26:43,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +59: [2023-04-29 11:26:43,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 3: [2023-04-29 11:26:43,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +36: [2023-04-29 11:26:43,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +45: [2023-04-29 11:26:43,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 3: [2023-04-29 11:26:43,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +11: [2023-04-29 11:26:43,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +54: [2023-04-29 11:26:43,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +54: [2023-04-29 11:26:43,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +36: [2023-04-29 11:26:43,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +13: [2023-04-29 11:26:43,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +41: [2023-04-29 11:26:43,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +13: [2023-04-29 11:26:43,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +13: [2023-04-29 11:26:43,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +16: [2023-04-29 11:26:43,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +16: [2023-04-29 11:26:43,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +13: [2023-04-29 11:26:43,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +16: [2023-04-29 11:26:43,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. +54: [2023-04-29 11:26:43,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +54: [2023-04-29 11:26:43,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... + 3: [2023-04-29 11:26:43,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... + 3: [2023-04-29 11:26:43,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +59: [2023-04-29 11:26:43,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +59: [2023-04-29 11:26:43,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +16: [2023-04-29 11:26:43,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_06-model_01-model_states.pt. + 4: [2023-04-29 11:26:43,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +45: [2023-04-29 11:26:43,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +41: [2023-04-29 11:26:43,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +54: [2023-04-29 11:26:43,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +11: [2023-04-29 11:26:43,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +54: [2023-04-29 11:26:43,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +41: [2023-04-29 11:26:43,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +30: [2023-04-29 11:26:43,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +30: [2023-04-29 11:26:43,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +30: [2023-04-29 11:26:43,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 3: [2023-04-29 11:26:43,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +11: [2023-04-29 11:26:43,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +19: [2023-04-29 11:26:43,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +48: [2023-04-29 11:26:43,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +48: [2023-04-29 11:26:43,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +48: [2023-04-29 11:26:43,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +30: [2023-04-29 11:26:43,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 4: [2023-04-29 11:26:43,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 4: [2023-04-29 11:26:43,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 3: [2023-04-29 11:26:43,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +48: [2023-04-29 11:26:43,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +11: [2023-04-29 11:26:43,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +29: [2023-04-29 11:26:43,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +41: [2023-04-29 11:26:43,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... + 4: [2023-04-29 11:26:43,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +19: [2023-04-29 11:26:43,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +49: [2023-04-29 11:26:43,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +49: [2023-04-29 11:26:43,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +36: [2023-04-29 11:26:43,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 4: [2023-04-29 11:26:43,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +45: [2023-04-29 11:26:43,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +44: [2023-04-29 11:26:43,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +44: [2023-04-29 11:26:43,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +44: [2023-04-29 11:26:43,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +44: [2023-04-29 11:26:43,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +29: [2023-04-29 11:26:43,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +29: [2023-04-29 11:26:43,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +29: [2023-04-29 11:26:43,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +41: [2023-04-29 11:26:43,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +49: [2023-04-29 11:26:43,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +46: [2023-04-29 11:26:43,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +46: [2023-04-29 11:26:43,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 3: [2023-04-29 11:26:43,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +49: [2023-04-29 11:26:43,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 4: [2023-04-29 11:26:43,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... + 4: [2023-04-29 11:26:43,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +56: [2023-04-29 11:26:43,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +56: [2023-04-29 11:26:43,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +46: [2023-04-29 11:26:43,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 4: [2023-04-29 11:26:43,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +46: [2023-04-29 11:26:43,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +36: [2023-04-29 11:26:43,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +44: [2023-04-29 11:26:43,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +44: [2023-04-29 11:26:43,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +44: [2023-04-29 11:26:43,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +49: [2023-04-29 11:26:43,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +56: [2023-04-29 11:26:43,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +30: [2023-04-29 11:26:43,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +30: [2023-04-29 11:26:43,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +49: [2023-04-29 11:26:43,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +49: [2023-04-29 11:26:43,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +56: [2023-04-29 11:26:43,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +56: [2023-04-29 11:26:43,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +45: [2023-04-29 11:26:43,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +46: [2023-04-29 11:26:43,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +44: [2023-04-29 11:26:43,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +59: [2023-04-29 11:26:43,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +46: [2023-04-29 11:26:43,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +56: [2023-04-29 11:26:43,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +46: [2023-04-29 11:26:43,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +46: [2023-04-29 11:26:43,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +19: [2023-04-29 11:26:43,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +30: [2023-04-29 11:26:43,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +45: [2023-04-29 11:26:43,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +30: [2023-04-29 11:26:43,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +59: [2023-04-29 11:26:43,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +49: [2023-04-29 11:26:43,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +42: [2023-04-29 11:26:43,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +42: [2023-04-29 11:26:43,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +42: [2023-04-29 11:26:43,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +42: [2023-04-29 11:26:43,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +56: [2023-04-29 11:26:43,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +56: [2023-04-29 11:26:43,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +59: [2023-04-29 11:26:43,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +45: [2023-04-29 11:26:43,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +16: [2023-04-29 11:26:43,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +42: [2023-04-29 11:26:43,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +17: [2023-04-29 11:26:43,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 11:26:43,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +18: [2023-04-29 11:26:43,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +18: [2023-04-29 11:26:43,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +18: [2023-04-29 11:26:43,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +13: [2023-04-29 11:26:43,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +18: [2023-04-29 11:26:43,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +59: [2023-04-29 11:26:43,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +13: [2023-04-29 11:26:43,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +13: [2023-04-29 11:26:43,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +45: [2023-04-29 11:26:43,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +42: [2023-04-29 11:26:43,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 0: [2023-04-29 11:26:43,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 0: [2023-04-29 11:26:43,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 0: [2023-04-29 11:26:43,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 0: [2023-04-29 11:26:43,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +16: [2023-04-29 11:26:43,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +42: [2023-04-29 11:26:43,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +42: [2023-04-29 11:26:43,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +13: [2023-04-29 11:26:43,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +43: [2023-04-29 11:26:43,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +48: [2023-04-29 11:26:43,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +17: [2023-04-29 11:26:43,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +35: [2023-04-29 11:26:43,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +35: [2023-04-29 11:26:43,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +35: [2023-04-29 11:26:43,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +35: [2023-04-29 11:26:43,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +43: [2023-04-29 11:26:43,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 11:26:43,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +16: [2023-04-29 11:26:43,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt... +48: [2023-04-29 11:26:43,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +48: [2023-04-29 11:26:43,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +48: [2023-04-29 11:26:43,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +57: [2023-04-29 11:26:43,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +57: [2023-04-29 11:26:43,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +17: [2023-04-29 11:26:43,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 11:26:43,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +17: [2023-04-29 11:26:43,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +43: [2023-04-29 11:26:43,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... + 8: [2023-04-29 11:26:43,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 8: [2023-04-29 11:26:43,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 8: [2023-04-29 11:26:43,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 8: [2023-04-29 11:26:43,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +30: [2023-04-29 11:26:43,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +30: [2023-04-29 11:26:43,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +30: [2023-04-29 11:26:43,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +30: [2023-04-29 11:26:43,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +43: [2023-04-29 11:26:43,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +43: [2023-04-29 11:26:43,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +17: [2023-04-29 11:26:43,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +17: [2023-04-29 11:26:43,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +17: [2023-04-29 11:26:43,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +58: [2023-04-29 11:26:43,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +58: [2023-04-29 11:26:43,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 11:26:43,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +57: [2023-04-29 11:26:43,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +57: [2023-04-29 11:26:43,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +57: [2023-04-29 11:26:43,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +57: [2023-04-29 11:26:43,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +58: [2023-04-29 11:26:43,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +51: [2023-04-29 11:26:43,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +48: [2023-04-29 11:26:43,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +21: [2023-04-29 11:26:43,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +21: [2023-04-29 11:26:43,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +58: [2023-04-29 11:26:43,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +48: [2023-04-29 11:26:43,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +48: [2023-04-29 11:26:43,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +48: [2023-04-29 11:26:43,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 11:26:43,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +58: [2023-04-29 11:26:43,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +58: [2023-04-29 11:26:43,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +58: [2023-04-29 11:26:43,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +28: [2023-04-29 11:26:43,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +58: [2023-04-29 11:26:43,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +58: [2023-04-29 11:26:43,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +21: [2023-04-29 11:26:43,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +21: [2023-04-29 11:26:43,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 2: [2023-04-29 11:26:43,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +28: [2023-04-29 11:26:43,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +57: [2023-04-29 11:26:43,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +51: [2023-04-29 11:26:43,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +48: [2023-04-29 11:26:43,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +51: [2023-04-29 11:26:43,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +58: [2023-04-29 11:26:43,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +57: [2023-04-29 11:26:43,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +58: [2023-04-29 11:26:43,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +48: [2023-04-29 11:26:43,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +21: [2023-04-29 11:26:43,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +21: [2023-04-29 11:26:43,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 4: [2023-04-29 11:26:43,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 4: [2023-04-29 11:26:43,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 4: [2023-04-29 11:26:43,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +58: [2023-04-29 11:26:43,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 2: [2023-04-29 11:26:43,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +48: [2023-04-29 11:26:43,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +51: [2023-04-29 11:26:43,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +51: [2023-04-29 11:26:43,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 4: [2023-04-29 11:26:43,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +53: [2023-04-29 11:26:43,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +53: [2023-04-29 11:26:43,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +53: [2023-04-29 11:26:43,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +18: [2023-04-29 11:26:43,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +53: [2023-04-29 11:26:43,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +48: [2023-04-29 11:26:43,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +21: [2023-04-29 11:26:43,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +21: [2023-04-29 11:26:43,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +28: [2023-04-29 11:26:43,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... + 0: [2023-04-29 11:26:43,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +28: [2023-04-29 11:26:43,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +51: [2023-04-29 11:26:43,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... + 4: [2023-04-29 11:26:43,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 0: [2023-04-29 11:26:43,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +18: [2023-04-29 11:26:43,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +18: [2023-04-29 11:26:43,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +18: [2023-04-29 11:26:43,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 4: [2023-04-29 11:26:43,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 4: [2023-04-29 11:26:43,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +15: [2023-04-29 11:26:43,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +15: [2023-04-29 11:26:43,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +15: [2023-04-29 11:26:43,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +15: [2023-04-29 11:26:43,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +28: [2023-04-29 11:26:43,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +28: [2023-04-29 11:26:43,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 9: [2023-04-29 11:26:43,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 9: [2023-04-29 11:26:43,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 9: [2023-04-29 11:26:43,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 9: [2023-04-29 11:26:43,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 9: [2023-04-29 11:26:43,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 9: [2023-04-29 11:26:43,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 9: [2023-04-29 11:26:43,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 9: [2023-04-29 11:26:43,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 0: [2023-04-29 11:26:43,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 0: [2023-04-29 11:26:43,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +51: [2023-04-29 11:26:43,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +51: [2023-04-29 11:26:43,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... + 4: [2023-04-29 11:26:43,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +40: [2023-04-29 11:26:43,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +40: [2023-04-29 11:26:43,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +40: [2023-04-29 11:26:43,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +40: [2023-04-29 11:26:43,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +28: [2023-04-29 11:26:43,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +28: [2023-04-29 11:26:43,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +11: [2023-04-29 11:26:43,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +35: [2023-04-29 11:26:43,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 8: [2023-04-29 11:26:43,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 8: [2023-04-29 11:26:43,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 9: [2023-04-29 11:26:43,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +35: [2023-04-29 11:26:43,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +35: [2023-04-29 11:26:43,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +35: [2023-04-29 11:26:43,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 8: [2023-04-29 11:26:43,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 8: [2023-04-29 11:26:43,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +40: [2023-04-29 11:26:43,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +11: [2023-04-29 11:26:43,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +40: [2023-04-29 11:26:43,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +40: [2023-04-29 11:26:43,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +40: [2023-04-29 11:26:43,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +44: [2023-04-29 11:26:43,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +44: [2023-04-29 11:26:43,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +44: [2023-04-29 11:26:43,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +44: [2023-04-29 11:26:43,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +29: [2023-04-29 11:26:43,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +56: [2023-04-29 11:26:43,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +44: [2023-04-29 11:26:43,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +49: [2023-04-29 11:26:43,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +49: [2023-04-29 11:26:43,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +11: [2023-04-29 11:26:43,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +11: [2023-04-29 11:26:43,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +49: [2023-04-29 11:26:43,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +49: [2023-04-29 11:26:43,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_28-model_01-model_states.pt. +29: [2023-04-29 11:26:43,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +59: [2023-04-29 11:26:43,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +29: [2023-04-29 11:26:43,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +29: [2023-04-29 11:26:43,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +59: [2023-04-29 11:26:43,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +11: [2023-04-29 11:26:43,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +49: [2023-04-29 11:26:43,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +11: [2023-04-29 11:26:43,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +11: [2023-04-29 11:26:43,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +58: [2023-04-29 11:26:43,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +58: [2023-04-29 11:26:43,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +53: [2023-04-29 11:26:43,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +53: [2023-04-29 11:26:43,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +58: [2023-04-29 11:26:43,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +58: [2023-04-29 11:26:43,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +29: [2023-04-29 11:26:43,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +29: [2023-04-29 11:26:43,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +45: [2023-04-29 11:26:43,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +30: [2023-04-29 11:26:43,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 11:26:43,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +53: [2023-04-29 11:26:43,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +44: [2023-04-29 11:26:43,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +53: [2023-04-29 11:26:43,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +20: [2023-04-29 11:26:43,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +59: [2023-04-29 11:26:43,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +15: [2023-04-29 11:26:43,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +56: [2023-04-29 11:26:43,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +20: [2023-04-29 11:26:43,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +20: [2023-04-29 11:26:43,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +46: [2023-04-29 11:26:43,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +46: [2023-04-29 11:26:43,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +20: [2023-04-29 11:26:43,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +29: [2023-04-29 11:26:43,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +15: [2023-04-29 11:26:43,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +15: [2023-04-29 11:26:43,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +11: [2023-04-29 11:26:43,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... + 6: [2023-04-29 11:26:43,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +15: [2023-04-29 11:26:43,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +59: [2023-04-29 11:26:43,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +59: [2023-04-29 11:26:43,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +59: [2023-04-29 11:26:43,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +56: [2023-04-29 11:26:43,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +59: [2023-04-29 11:26:43,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +30: [2023-04-29 11:26:43,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +30: [2023-04-29 11:26:43,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +56: [2023-04-29 11:26:43,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +42: [2023-04-29 11:26:43,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +16: [2023-04-29 11:26:43,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +31: [2023-04-29 11:26:43,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +31: [2023-04-29 11:26:43,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +31: [2023-04-29 11:26:43,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +31: [2023-04-29 11:26:43,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +44: [2023-04-29 11:26:43,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +46: [2023-04-29 11:26:43,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +29: [2023-04-29 11:26:43,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +45: [2023-04-29 11:26:43,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +46: [2023-04-29 11:26:43,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +45: [2023-04-29 11:26:43,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 6: [2023-04-29 11:26:43,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 6: [2023-04-29 11:26:43,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +30: [2023-04-29 11:26:43,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +59: [2023-04-29 11:26:43,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +59: [2023-04-29 11:26:43,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... + 6: [2023-04-29 11:26:43,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +44: [2023-04-29 11:26:43,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +59: [2023-04-29 11:26:43,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +30: [2023-04-29 11:26:43,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +30: [2023-04-29 11:26:43,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +30: [2023-04-29 11:26:43,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +49: [2023-04-29 11:26:43,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +49: [2023-04-29 11:26:43,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +45: [2023-04-29 11:26:43,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +49: [2023-04-29 11:26:43,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +48: [2023-04-29 11:26:43,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +56: [2023-04-29 11:26:43,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +45: [2023-04-29 11:26:43,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +45: [2023-04-29 11:26:43,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +16: [2023-04-29 11:26:43,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 11:26:43,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +42: [2023-04-29 11:26:43,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +30: [2023-04-29 11:26:43,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +42: [2023-04-29 11:26:43,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +44: [2023-04-29 11:26:43,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +44: [2023-04-29 11:26:43,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +13: [2023-04-29 11:26:43,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 11:26:43,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +13: [2023-04-29 11:26:43,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +44: [2023-04-29 11:26:43,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +57: [2023-04-29 11:26:43,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +16: [2023-04-29 11:26:43,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +48: [2023-04-29 11:26:43,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +42: [2023-04-29 11:26:43,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +44: [2023-04-29 11:26:43,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +49: [2023-04-29 11:26:43,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +49: [2023-04-29 11:26:43,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +61: [2023-04-29 11:26:43,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +61: [2023-04-29 11:26:43,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +13: [2023-04-29 11:26:43,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_00-model_states.pt. +16: [2023-04-29 11:26:43,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +16: [2023-04-29 11:26:43,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +45: [2023-04-29 11:26:43,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +61: [2023-04-29 11:26:43,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +48: [2023-04-29 11:26:43,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +45: [2023-04-29 11:26:43,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +44: [2023-04-29 11:26:43,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +61: [2023-04-29 11:26:43,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +49: [2023-04-29 11:26:43,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +16: [2023-04-29 11:26:43,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +59: [2023-04-29 11:26:43,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 11:26:43,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 2: [2023-04-29 11:26:43,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 4: [2023-04-29 11:26:43,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +20: [2023-04-29 11:26:43,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +57: [2023-04-29 11:26:43,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +20: [2023-04-29 11:26:43,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +46: [2023-04-29 11:26:43,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +46: [2023-04-29 11:26:43,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +49: [2023-04-29 11:26:43,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +13: [2023-04-29 11:26:43,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +13: [2023-04-29 11:26:43,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +13: [2023-04-29 11:26:43,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +13: [2023-04-29 11:26:43,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt... +49: [2023-04-29 11:26:43,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt... +56: [2023-04-29 11:26:43,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +56: [2023-04-29 11:26:43,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +48: [2023-04-29 11:26:43,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +46: [2023-04-29 11:26:43,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +48: [2023-04-29 11:26:43,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +48: [2023-04-29 11:26:43,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +48: [2023-04-29 11:26:43,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +20: [2023-04-29 11:26:43,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +42: [2023-04-29 11:26:43,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +35: [2023-04-29 11:26:43,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +35: [2023-04-29 11:26:43,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +46: [2023-04-29 11:26:43,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 2: [2023-04-29 11:26:43,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +20: [2023-04-29 11:26:43,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +31: [2023-04-29 11:26:43,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +56: [2023-04-29 11:26:43,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +44: [2023-04-29 11:26:43,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +21: [2023-04-29 11:26:43,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +21: [2023-04-29 11:26:43,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +21: [2023-04-29 11:26:43,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +31: [2023-04-29 11:26:43,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 4: [2023-04-29 11:26:43,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +35: [2023-04-29 11:26:43,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +35: [2023-04-29 11:26:43,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +31: [2023-04-29 11:26:43,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +15: [2023-04-29 11:26:43,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +15: [2023-04-29 11:26:43,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +21: [2023-04-29 11:26:43,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +57: [2023-04-29 11:26:43,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 9: [2023-04-29 11:26:43,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 4: [2023-04-29 11:26:43,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +58: [2023-04-29 11:26:43,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +31: [2023-04-29 11:26:43,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +57: [2023-04-29 11:26:43,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +48: [2023-04-29 11:26:43,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +48: [2023-04-29 11:26:43,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +48: [2023-04-29 11:26:43,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +17: [2023-04-29 11:26:43,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +17: [2023-04-29 11:26:43,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +44: [2023-04-29 11:26:43,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +17: [2023-04-29 11:26:43,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +17: [2023-04-29 11:26:43,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +11: [2023-04-29 11:26:43,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +11: [2023-04-29 11:26:43,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +15: [2023-04-29 11:26:43,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +15: [2023-04-29 11:26:43,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +11: [2023-04-29 11:26:43,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +11: [2023-04-29 11:26:43,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +10: [2023-04-29 11:26:43,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +10: [2023-04-29 11:26:43,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +59: [2023-04-29 11:26:43,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +35: [2023-04-29 11:26:43,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +10: [2023-04-29 11:26:43,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +35: [2023-04-29 11:26:43,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +15: [2023-04-29 11:26:43,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +10: [2023-04-29 11:26:43,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +15: [2023-04-29 11:26:43,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +35: [2023-04-29 11:26:43,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +44: [2023-04-29 11:26:43,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 0: [2023-04-29 11:26:43,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 0: [2023-04-29 11:26:43,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 0: [2023-04-29 11:26:43,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 0: [2023-04-29 11:26:43,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 0: [2023-04-29 11:26:43,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 0: [2023-04-29 11:26:43,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +57: [2023-04-29 11:26:43,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 11:26:43,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 11:26:43,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +48: [2023-04-29 11:26:43,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 9: [2023-04-29 11:26:43,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +10: [2023-04-29 11:26:43,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +17: [2023-04-29 11:26:43,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +35: [2023-04-29 11:26:43,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +11: [2023-04-29 11:26:43,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +17: [2023-04-29 11:26:43,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +49: [2023-04-29 11:26:43,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +10: [2023-04-29 11:26:43,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +27: [2023-04-29 11:26:43,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +27: [2023-04-29 11:26:43,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +27: [2023-04-29 11:26:43,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +17: [2023-04-29 11:26:43,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +11: [2023-04-29 11:26:43,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +15: [2023-04-29 11:26:43,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +15: [2023-04-29 11:26:43,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +19: [2023-04-29 11:26:43,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +19: [2023-04-29 11:26:43,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +27: [2023-04-29 11:26:43,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +40: [2023-04-29 11:26:43,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +10: [2023-04-29 11:26:43,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 0: [2023-04-29 11:26:43,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +11: [2023-04-29 11:26:43,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +11: [2023-04-29 11:26:43,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 0: [2023-04-29 11:26:43,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +42: [2023-04-29 11:26:43,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +17: [2023-04-29 11:26:43,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +58: [2023-04-29 11:26:43,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +58: [2023-04-29 11:26:43,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +58: [2023-04-29 11:26:43,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +10: [2023-04-29 11:26:43,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 0: [2023-04-29 11:26:43,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 0: [2023-04-29 11:26:43,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +19: [2023-04-29 11:26:43,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 0: [2023-04-29 11:26:43,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +19: [2023-04-29 11:26:43,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 0: [2023-04-29 11:26:43,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +42: [2023-04-29 11:26:43,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 11:26:43,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +49: [2023-04-29 11:26:43,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +49: [2023-04-29 11:26:43,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 11:26:43,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +48: [2023-04-29 11:26:43,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 0: [2023-04-29 11:26:43,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 0: [2023-04-29 11:26:43,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 4: [2023-04-29 11:26:43,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 9: [2023-04-29 11:26:43,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +27: [2023-04-29 11:26:43,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +61: [2023-04-29 11:26:43,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +61: [2023-04-29 11:26:43,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +27: [2023-04-29 11:26:43,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +27: [2023-04-29 11:26:43,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +27: [2023-04-29 11:26:43,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +61: [2023-04-29 11:26:43,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +61: [2023-04-29 11:26:43,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +35: [2023-04-29 11:26:43,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 2: [2023-04-29 11:26:43,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +57: [2023-04-29 11:26:43,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 4: [2023-04-29 11:26:43,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +40: [2023-04-29 11:26:43,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +40: [2023-04-29 11:26:43,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +40: [2023-04-29 11:26:43,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 7: [2023-04-29 11:26:43,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +35: [2023-04-29 11:26:43,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +35: [2023-04-29 11:26:43,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +48: [2023-04-29 11:26:43,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 0: [2023-04-29 11:26:43,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 4: [2023-04-29 11:26:43,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 0: [2023-04-29 11:26:43,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 2: [2023-04-29 11:26:43,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +12: [2023-04-29 11:26:43,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +12: [2023-04-29 11:26:43,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +12: [2023-04-29 11:26:43,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +12: [2023-04-29 11:26:43,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +35: [2023-04-29 11:26:43,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +35: [2023-04-29 11:26:43,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... + 7: [2023-04-29 11:26:43,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 7: [2023-04-29 11:26:43,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +35: [2023-04-29 11:26:43,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +35: [2023-04-29 11:26:43,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... + 7: [2023-04-29 11:26:43,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 4: [2023-04-29 11:26:43,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +21: [2023-04-29 11:26:43,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +21: [2023-04-29 11:26:43,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +21: [2023-04-29 11:26:43,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +21: [2023-04-29 11:26:43,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 2: [2023-04-29 11:26:43,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +57: [2023-04-29 11:26:43,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +58: [2023-04-29 11:26:43,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +12: [2023-04-29 11:26:43,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +12: [2023-04-29 11:26:43,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +12: [2023-04-29 11:26:43,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 7: [2023-04-29 11:26:43,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +12: [2023-04-29 11:26:43,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +16: [2023-04-29 11:26:43,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +16: [2023-04-29 11:26:43,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +16: [2023-04-29 11:26:43,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +18: [2023-04-29 11:26:43,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +18: [2023-04-29 11:26:43,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +18: [2023-04-29 11:26:43,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +18: [2023-04-29 11:26:43,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +18: [2023-04-29 11:26:43,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +18: [2023-04-29 11:26:43,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +18: [2023-04-29 11:26:43,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +16: [2023-04-29 11:26:43,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +18: [2023-04-29 11:26:43,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +57: [2023-04-29 11:26:43,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 7: [2023-04-29 11:26:43,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 7: [2023-04-29 11:26:43,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +35: [2023-04-29 11:26:43,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... + 6: [2023-04-29 11:26:43,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +48: [2023-04-29 11:26:43,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 7: [2023-04-29 11:26:43,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +10: [2023-04-29 11:26:43,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +10: [2023-04-29 11:26:43,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +10: [2023-04-29 11:26:43,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 7: [2023-04-29 11:26:43,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +10: [2023-04-29 11:26:43,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +62: [2023-04-29 11:26:43,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +62: [2023-04-29 11:26:43,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +16: [2023-04-29 11:26:43,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +62: [2023-04-29 11:26:43,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +40: [2023-04-29 11:26:43,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 9: [2023-04-29 11:26:43,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +62: [2023-04-29 11:26:43,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. + 6: [2023-04-29 11:26:43,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 6: [2023-04-29 11:26:43,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +18: [2023-04-29 11:26:43,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +18: [2023-04-29 11:26:43,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 6: [2023-04-29 11:26:43,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +18: [2023-04-29 11:26:43,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +16: [2023-04-29 11:26:43,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +18: [2023-04-29 11:26:43,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +48: [2023-04-29 11:26:43,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +16: [2023-04-29 11:26:43,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +18: [2023-04-29 11:26:43,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +15: [2023-04-29 11:26:43,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +16: [2023-04-29 11:26:43,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +19: [2023-04-29 11:26:43,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +18: [2023-04-29 11:26:43,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +44: [2023-04-29 11:26:43,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +18: [2023-04-29 11:26:43,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +18: [2023-04-29 11:26:43,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +49: [2023-04-29 11:26:43,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +58: [2023-04-29 11:26:43,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +19: [2023-04-29 11:26:43,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +58: [2023-04-29 11:26:43,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +19: [2023-04-29 11:26:43,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +58: [2023-04-29 11:26:43,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +26: [2023-04-29 11:26:43,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +26: [2023-04-29 11:26:43,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +26: [2023-04-29 11:26:43,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +33: [2023-04-29 11:26:43,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +33: [2023-04-29 11:26:43,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +33: [2023-04-29 11:26:43,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +33: [2023-04-29 11:26:43,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +26: [2023-04-29 11:26:43,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +19: [2023-04-29 11:26:44,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +48: [2023-04-29 11:26:44,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +44: [2023-04-29 11:26:44,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +40: [2023-04-29 11:26:44,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +49: [2023-04-29 11:26:44,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... + 4: [2023-04-29 11:26:44,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +15: [2023-04-29 11:26:44,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +15: [2023-04-29 11:26:44,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +15: [2023-04-29 11:26:44,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +58: [2023-04-29 11:26:44,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +58: [2023-04-29 11:26:44,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +58: [2023-04-29 11:26:44,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +57: [2023-04-29 11:26:44,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +57: [2023-04-29 11:26:44,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +57: [2023-04-29 11:26:44,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +57: [2023-04-29 11:26:44,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +49: [2023-04-29 11:26:44,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +15: [2023-04-29 11:26:44,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +40: [2023-04-29 11:26:44,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +40: [2023-04-29 11:26:44,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +34: [2023-04-29 11:26:44,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +34: [2023-04-29 11:26:44,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +34: [2023-04-29 11:26:44,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +34: [2023-04-29 11:26:44,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +58: [2023-04-29 11:26:44,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +44: [2023-04-29 11:26:44,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +58: [2023-04-29 11:26:44,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +58: [2023-04-29 11:26:44,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +58: [2023-04-29 11:26:44,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +15: [2023-04-29 11:26:44,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +49: [2023-04-29 11:26:44,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +15: [2023-04-29 11:26:44,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +49: [2023-04-29 11:26:44,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +46: [2023-04-29 11:26:44,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +46: [2023-04-29 11:26:44,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +46: [2023-04-29 11:26:44,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +46: [2023-04-29 11:26:44,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +32: [2023-04-29 11:26:44,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +32: [2023-04-29 11:26:44,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +58: [2023-04-29 11:26:44,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +44: [2023-04-29 11:26:44,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +44: [2023-04-29 11:26:44,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +15: [2023-04-29 11:26:44,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +44: [2023-04-29 11:26:44,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +32: [2023-04-29 11:26:44,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +12: [2023-04-29 11:26:44,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +12: [2023-04-29 11:26:44,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +12: [2023-04-29 11:26:44,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +12: [2023-04-29 11:26:44,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +32: [2023-04-29 11:26:44,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +10: [2023-04-29 11:26:44,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +62: [2023-04-29 11:26:44,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +49: [2023-04-29 11:26:44,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +38: [2023-04-29 11:26:44,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +38: [2023-04-29 11:26:44,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +25: [2023-04-29 11:26:44,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +25: [2023-04-29 11:26:44,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +25: [2023-04-29 11:26:44,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +38: [2023-04-29 11:26:44,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. + 6: [2023-04-29 11:26:44,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +38: [2023-04-29 11:26:44,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +25: [2023-04-29 11:26:44,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +62: [2023-04-29 11:26:44,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +62: [2023-04-29 11:26:44,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +62: [2023-04-29 11:26:44,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +10: [2023-04-29 11:26:44,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +44: [2023-04-29 11:26:44,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +44: [2023-04-29 11:26:44,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +26: [2023-04-29 11:26:44,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +10: [2023-04-29 11:26:44,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +10: [2023-04-29 11:26:44,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +35: [2023-04-29 11:26:44,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +11: [2023-04-29 11:26:44,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +33: [2023-04-29 11:26:44,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +17: [2023-04-29 11:26:44,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +33: [2023-04-29 11:26:44,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +33: [2023-04-29 11:26:44,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +49: [2023-04-29 11:26:44,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_00-model_states.pt. +33: [2023-04-29 11:26:44,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +15: [2023-04-29 11:26:44,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +15: [2023-04-29 11:26:44,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +26: [2023-04-29 11:26:44,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +26: [2023-04-29 11:26:44,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 0: [2023-04-29 11:26:44,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +17: [2023-04-29 11:26:44,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +36: [2023-04-29 11:26:44,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +36: [2023-04-29 11:26:44,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +36: [2023-04-29 11:26:44,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +27: [2023-04-29 11:26:44,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +36: [2023-04-29 11:26:44,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +26: [2023-04-29 11:26:44,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +35: [2023-04-29 11:26:44,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 0: [2023-04-29 11:26:44,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +10: [2023-04-29 11:26:44,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +51: [2023-04-29 11:26:44,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +51: [2023-04-29 11:26:44,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 11:26:44,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +49: [2023-04-29 11:26:44,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt... +35: [2023-04-29 11:26:44,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +51: [2023-04-29 11:26:44,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 11:26:44,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +51: [2023-04-29 11:26:44,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +23: [2023-04-29 11:26:44,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +23: [2023-04-29 11:26:44,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +23: [2023-04-29 11:26:44,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +23: [2023-04-29 11:26:44,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +17: [2023-04-29 11:26:44,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +17: [2023-04-29 11:26:44,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +34: [2023-04-29 11:26:44,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +57: [2023-04-29 11:26:44,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +34: [2023-04-29 11:26:44,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +57: [2023-04-29 11:26:44,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +12: [2023-04-29 11:26:44,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +36: [2023-04-29 11:26:44,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +36: [2023-04-29 11:26:44,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +36: [2023-04-29 11:26:44,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +36: [2023-04-29 11:26:44,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 11:26:44,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 11:26:44,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 11:26:44,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +34: [2023-04-29 11:26:44,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +11: [2023-04-29 11:26:44,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +11: [2023-04-29 11:26:44,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +11: [2023-04-29 11:26:44,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +51: [2023-04-29 11:26:44,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 0: [2023-04-29 11:26:44,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 0: [2023-04-29 11:26:44,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +32: [2023-04-29 11:26:44,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +52: [2023-04-29 11:26:44,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +52: [2023-04-29 11:26:44,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +52: [2023-04-29 11:26:44,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +27: [2023-04-29 11:26:44,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +52: [2023-04-29 11:26:44,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +12: [2023-04-29 11:26:44,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +34: [2023-04-29 11:26:44,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +46: [2023-04-29 11:26:44,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +10: [2023-04-29 11:26:44,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +12: [2023-04-29 11:26:44,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +12: [2023-04-29 11:26:44,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +15: [2023-04-29 11:26:44,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +15: [2023-04-29 11:26:44,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +46: [2023-04-29 11:26:44,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +46: [2023-04-29 11:26:44,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +46: [2023-04-29 11:26:44,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +25: [2023-04-29 11:26:44,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +25: [2023-04-29 11:26:44,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +50: [2023-04-29 11:26:44,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. + 7: [2023-04-29 11:26:44,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +50: [2023-04-29 11:26:44,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +50: [2023-04-29 11:26:44,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +27: [2023-04-29 11:26:44,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +27: [2023-04-29 11:26:44,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +50: [2023-04-29 11:26:44,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +32: [2023-04-29 11:26:44,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +32: [2023-04-29 11:26:44,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +25: [2023-04-29 11:26:44,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +25: [2023-04-29 11:26:44,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +38: [2023-04-29 11:26:44,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +38: [2023-04-29 11:26:44,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +35: [2023-04-29 11:26:44,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +38: [2023-04-29 11:26:44,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +11: [2023-04-29 11:26:44,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +38: [2023-04-29 11:26:44,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +18: [2023-04-29 11:26:44,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +17: [2023-04-29 11:26:44,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 1: [2023-04-29 11:26:44,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 1: [2023-04-29 11:26:44,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 1: [2023-04-29 11:26:44,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +35: [2023-04-29 11:26:44,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +15: [2023-04-29 11:26:44,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +18: [2023-04-29 11:26:44,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +15: [2023-04-29 11:26:44,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +32: [2023-04-29 11:26:44,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +16: [2023-04-29 11:26:44,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 0: [2023-04-29 11:26:44,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +54: [2023-04-29 11:26:44,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +54: [2023-04-29 11:26:44,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +54: [2023-04-29 11:26:44,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +17: [2023-04-29 11:26:44,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +27: [2023-04-29 11:26:44,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +10: [2023-04-29 11:26:44,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +54: [2023-04-29 11:26:44,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +12: [2023-04-29 11:26:44,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +12: [2023-04-29 11:26:44,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 7: [2023-04-29 11:26:44,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 7: [2023-04-29 11:26:44,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 0: [2023-04-29 11:26:44,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +18: [2023-04-29 11:26:44,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +54: [2023-04-29 11:26:44,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +19: [2023-04-29 11:26:44,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +54: [2023-04-29 11:26:44,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +54: [2023-04-29 11:26:44,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +54: [2023-04-29 11:26:44,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 7: [2023-04-29 11:26:44,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +10: [2023-04-29 11:26:44,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +23: [2023-04-29 11:26:44,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +23: [2023-04-29 11:26:44,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +35: [2023-04-29 11:26:44,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +23: [2023-04-29 11:26:44,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +23: [2023-04-29 11:26:44,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +35: [2023-04-29 11:26:44,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +17: [2023-04-29 11:26:44,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +17: [2023-04-29 11:26:44,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +16: [2023-04-29 11:26:44,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +13: [2023-04-29 11:26:44,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +13: [2023-04-29 11:26:44,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +13: [2023-04-29 11:26:44,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +19: [2023-04-29 11:26:44,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +19: [2023-04-29 11:26:44,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +13: [2023-04-29 11:26:44,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +10: [2023-04-29 11:26:44,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +10: [2023-04-29 11:26:44,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +12: [2023-04-29 11:26:44,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +12: [2023-04-29 11:26:44,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +18: [2023-04-29 11:26:44,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +16: [2023-04-29 11:26:44,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +16: [2023-04-29 11:26:44,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +52: [2023-04-29 11:26:44,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +15: [2023-04-29 11:26:44,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +52: [2023-04-29 11:26:44,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +15: [2023-04-29 11:26:44,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +52: [2023-04-29 11:26:44,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +52: [2023-04-29 11:26:44,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +11: [2023-04-29 11:26:44,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +42: [2023-04-29 11:26:44,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +42: [2023-04-29 11:26:44,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +42: [2023-04-29 11:26:44,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +62: [2023-04-29 11:26:44,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +62: [2023-04-29 11:26:44,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +62: [2023-04-29 11:26:44,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +13: [2023-04-29 11:26:44,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +50: [2023-04-29 11:26:44,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +62: [2023-04-29 11:26:44,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +62: [2023-04-29 11:26:44,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +42: [2023-04-29 11:26:44,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. + 0: [2023-04-29 11:26:44,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +27: [2023-04-29 11:26:44,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +27: [2023-04-29 11:26:44,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +13: [2023-04-29 11:26:44,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +19: [2023-04-29 11:26:44,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +13: [2023-04-29 11:26:44,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +13: [2023-04-29 11:26:44,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 7: [2023-04-29 11:26:44,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +11: [2023-04-29 11:26:44,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +11: [2023-04-29 11:26:44,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 0: [2023-04-29 11:26:44,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +19: [2023-04-29 11:26:44,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +50: [2023-04-29 11:26:44,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +27: [2023-04-29 11:26:44,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +29: [2023-04-29 11:26:44,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +29: [2023-04-29 11:26:44,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +29: [2023-04-29 11:26:44,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +50: [2023-04-29 11:26:44,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +50: [2023-04-29 11:26:44,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +62: [2023-04-29 11:26:44,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +62: [2023-04-29 11:26:44,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +39: [2023-04-29 11:26:44,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +29: [2023-04-29 11:26:44,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +39: [2023-04-29 11:26:44,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +39: [2023-04-29 11:26:44,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +62: [2023-04-29 11:26:44,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +39: [2023-04-29 11:26:44,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +62: [2023-04-29 11:26:44,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +16: [2023-04-29 11:26:44,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +35: [2023-04-29 11:26:44,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +62: [2023-04-29 11:26:44,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +18: [2023-04-29 11:26:44,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +19: [2023-04-29 11:26:44,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +29: [2023-04-29 11:26:44,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +18: [2023-04-29 11:26:44,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +19: [2023-04-29 11:26:44,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +32: [2023-04-29 11:26:44,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +32: [2023-04-29 11:26:44,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +32: [2023-04-29 11:26:44,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +32: [2023-04-29 11:26:44,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +29: [2023-04-29 11:26:44,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +29: [2023-04-29 11:26:44,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +29: [2023-04-29 11:26:44,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +43: [2023-04-29 11:26:44,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +43: [2023-04-29 11:26:44,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +43: [2023-04-29 11:26:44,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +43: [2023-04-29 11:26:44,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +19: [2023-04-29 11:26:44,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +62: [2023-04-29 11:26:44,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +12: [2023-04-29 11:26:44,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +60: [2023-04-29 11:26:44,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +60: [2023-04-29 11:26:44,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +12: [2023-04-29 11:26:44,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +43: [2023-04-29 11:26:44,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +32: [2023-04-29 11:26:44,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +43: [2023-04-29 11:26:44,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +62: [2023-04-29 11:26:44,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +62: [2023-04-29 11:26:44,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +43: [2023-04-29 11:26:44,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +32: [2023-04-29 11:26:44,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +43: [2023-04-29 11:26:44,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +60: [2023-04-29 11:26:44,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +60: [2023-04-29 11:26:44,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +32: [2023-04-29 11:26:44,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +10: [2023-04-29 11:26:44,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +32: [2023-04-29 11:26:44,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +62: [2023-04-29 11:26:44,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +40: [2023-04-29 11:26:44,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +40: [2023-04-29 11:26:44,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +40: [2023-04-29 11:26:44,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +40: [2023-04-29 11:26:44,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +56: [2023-04-29 11:26:44,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +56: [2023-04-29 11:26:44,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +63: [2023-04-29 11:26:44,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +63: [2023-04-29 11:26:44,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +16: [2023-04-29 11:26:44,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +63: [2023-04-29 11:26:44,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +18: [2023-04-29 11:26:44,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +63: [2023-04-29 11:26:44,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +56: [2023-04-29 11:26:44,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +10: [2023-04-29 11:26:44,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +56: [2023-04-29 11:26:44,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +57: [2023-04-29 11:26:44,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +37: [2023-04-29 11:26:44,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +37: [2023-04-29 11:26:44,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +37: [2023-04-29 11:26:44,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +62: [2023-04-29 11:26:44,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +37: [2023-04-29 11:26:44,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +62: [2023-04-29 11:26:44,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +10: [2023-04-29 11:26:44,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 7: [2023-04-29 11:26:44,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +47: [2023-04-29 11:26:44,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +47: [2023-04-29 11:26:44,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. + 7: [2023-04-29 11:26:44,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +22: [2023-04-29 11:26:44,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +22: [2023-04-29 11:26:44,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +22: [2023-04-29 11:26:44,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +22: [2023-04-29 11:26:44,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +12: [2023-04-29 11:26:44,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +18: [2023-04-29 11:26:44,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +12: [2023-04-29 11:26:44,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 7: [2023-04-29 11:26:44,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +46: [2023-04-29 11:26:44,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +47: [2023-04-29 11:26:44,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +47: [2023-04-29 11:26:44,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +16: [2023-04-29 11:26:44,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +16: [2023-04-29 11:26:44,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +57: [2023-04-29 11:26:44,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +36: [2023-04-29 11:26:44,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +23: [2023-04-29 11:26:44,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +23: [2023-04-29 11:26:44,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +23: [2023-04-29 11:26:44,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +23: [2023-04-29 11:26:44,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +42: [2023-04-29 11:26:44,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +34: [2023-04-29 11:26:44,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +34: [2023-04-29 11:26:44,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +42: [2023-04-29 11:26:44,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +42: [2023-04-29 11:26:44,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +42: [2023-04-29 11:26:44,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +38: [2023-04-29 11:26:44,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +22: [2023-04-29 11:26:44,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +22: [2023-04-29 11:26:44,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +12: [2023-04-29 11:26:44,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 5: [2023-04-29 11:26:44,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 5: [2023-04-29 11:26:44,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +39: [2023-04-29 11:26:44,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +36: [2023-04-29 11:26:44,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +22: [2023-04-29 11:26:44,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +57: [2023-04-29 11:26:44,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +39: [2023-04-29 11:26:44,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +46: [2023-04-29 11:26:44,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +39: [2023-04-29 11:26:44,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +46: [2023-04-29 11:26:44,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +10: [2023-04-29 11:26:44,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +39: [2023-04-29 11:26:44,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +38: [2023-04-29 11:26:44,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +46: [2023-04-29 11:26:44,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +22: [2023-04-29 11:26:44,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +32: [2023-04-29 11:26:44,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 11:26:44,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +57: [2023-04-29 11:26:44,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +34: [2023-04-29 11:26:44,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +34: [2023-04-29 11:26:44,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +51: [2023-04-29 11:26:44,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +12: [2023-04-29 11:26:44,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +23: [2023-04-29 11:26:44,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +34: [2023-04-29 11:26:44,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +46: [2023-04-29 11:26:44,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 2: [2023-04-29 11:26:44,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 2: [2023-04-29 11:26:44,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +23: [2023-04-29 11:26:44,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +23: [2023-04-29 11:26:44,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 2: [2023-04-29 11:26:44,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +46: [2023-04-29 11:26:44,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +51: [2023-04-29 11:26:44,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +12: [2023-04-29 11:26:44,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +23: [2023-04-29 11:26:44,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +41: [2023-04-29 11:26:44,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +60: [2023-04-29 11:26:44,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +57: [2023-04-29 11:26:44,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +34: [2023-04-29 11:26:44,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +41: [2023-04-29 11:26:44,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +41: [2023-04-29 11:26:44,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +46: [2023-04-29 11:26:44,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +41: [2023-04-29 11:26:44,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +32: [2023-04-29 11:26:44,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +60: [2023-04-29 11:26:44,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 11:26:44,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +51: [2023-04-29 11:26:44,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 11:26:44,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +38: [2023-04-29 11:26:44,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +57: [2023-04-29 11:26:44,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... + 8: [2023-04-29 11:26:44,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +32: [2023-04-29 11:26:44,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +12: [2023-04-29 11:26:44,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 8: [2023-04-29 11:26:44,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +46: [2023-04-29 11:26:44,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +34: [2023-04-29 11:26:44,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +36: [2023-04-29 11:26:44,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +60: [2023-04-29 11:26:44,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +61: [2023-04-29 11:26:44,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +61: [2023-04-29 11:26:44,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +61: [2023-04-29 11:26:44,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +60: [2023-04-29 11:26:44,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +61: [2023-04-29 11:26:44,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +38: [2023-04-29 11:26:44,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +38: [2023-04-29 11:26:44,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +61: [2023-04-29 11:26:44,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +61: [2023-04-29 11:26:44,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +61: [2023-04-29 11:26:44,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +61: [2023-04-29 11:26:44,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +38: [2023-04-29 11:26:44,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +34: [2023-04-29 11:26:44,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +10: [2023-04-29 11:26:44,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +36: [2023-04-29 11:26:44,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +36: [2023-04-29 11:26:44,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +54: [2023-04-29 11:26:44,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +36: [2023-04-29 11:26:44,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +40: [2023-04-29 11:26:44,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +40: [2023-04-29 11:26:44,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +10: [2023-04-29 11:26:44,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +10: [2023-04-29 11:26:44,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +40: [2023-04-29 11:26:44,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +32: [2023-04-29 11:26:44,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +61: [2023-04-29 11:26:44,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +40: [2023-04-29 11:26:44,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +61: [2023-04-29 11:26:44,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 8: [2023-04-29 11:26:44,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +38: [2023-04-29 11:26:44,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +38: [2023-04-29 11:26:44,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +61: [2023-04-29 11:26:44,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +61: [2023-04-29 11:26:44,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +56: [2023-04-29 11:26:44,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 8: [2023-04-29 11:26:44,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +56: [2023-04-29 11:26:44,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +47: [2023-04-29 11:26:44,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +47: [2023-04-29 11:26:44,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +61: [2023-04-29 11:26:44,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 8: [2023-04-29 11:26:44,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 8: [2023-04-29 11:26:44,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +61: [2023-04-29 11:26:44,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +63: [2023-04-29 11:26:44,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +36: [2023-04-29 11:26:44,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +22: [2023-04-29 11:26:44,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +22: [2023-04-29 11:26:44,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 8: [2023-04-29 11:26:44,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +61: [2023-04-29 11:26:44,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +61: [2023-04-29 11:26:44,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... + 8: [2023-04-29 11:26:44,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +36: [2023-04-29 11:26:44,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +63: [2023-04-29 11:26:44,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +12: [2023-04-29 11:26:44,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +12: [2023-04-29 11:26:44,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +24: [2023-04-29 11:26:44,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +24: [2023-04-29 11:26:44,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +24: [2023-04-29 11:26:44,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +47: [2023-04-29 11:26:44,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +24: [2023-04-29 11:26:44,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +24: [2023-04-29 11:26:44,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +24: [2023-04-29 11:26:44,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +24: [2023-04-29 11:26:44,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +22: [2023-04-29 11:26:44,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +24: [2023-04-29 11:26:44,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +22: [2023-04-29 11:26:44,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +37: [2023-04-29 11:26:44,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +56: [2023-04-29 11:26:44,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +37: [2023-04-29 11:26:44,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +37: [2023-04-29 11:26:44,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +10: [2023-04-29 11:26:44,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +36: [2023-04-29 11:26:44,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +37: [2023-04-29 11:26:44,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +10: [2023-04-29 11:26:44,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +47: [2023-04-29 11:26:44,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +10: [2023-04-29 11:26:44,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +56: [2023-04-29 11:26:44,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +63: [2023-04-29 11:26:44,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +23: [2023-04-29 11:26:44,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +23: [2023-04-29 11:26:44,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +63: [2023-04-29 11:26:44,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +24: [2023-04-29 11:26:44,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +24: [2023-04-29 11:26:44,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +24: [2023-04-29 11:26:44,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +12: [2023-04-29 11:26:44,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +12: [2023-04-29 11:26:44,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +13: [2023-04-29 11:26:44,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +54: [2023-04-29 11:26:44,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +36: [2023-04-29 11:26:44,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +51: [2023-04-29 11:26:44,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +24: [2023-04-29 11:26:44,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +24: [2023-04-29 11:26:44,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +24: [2023-04-29 11:26:44,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +24: [2023-04-29 11:26:44,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +24: [2023-04-29 11:26:44,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +54: [2023-04-29 11:26:44,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +54: [2023-04-29 11:26:44,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +23: [2023-04-29 11:26:44,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +23: [2023-04-29 11:26:44,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +13: [2023-04-29 11:26:44,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +23: [2023-04-29 11:26:44,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +50: [2023-04-29 11:26:44,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +62: [2023-04-29 11:26:44,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +32: [2023-04-29 11:26:44,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +62: [2023-04-29 11:26:44,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +55: [2023-04-29 11:26:44,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +55: [2023-04-29 11:26:44,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +51: [2023-04-29 11:26:44,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +55: [2023-04-29 11:26:44,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +41: [2023-04-29 11:26:44,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +23: [2023-04-29 11:26:44,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +55: [2023-04-29 11:26:44,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. + 1: [2023-04-29 11:26:44,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +50: [2023-04-29 11:26:44,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +50: [2023-04-29 11:26:44,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +62: [2023-04-29 11:26:44,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +62: [2023-04-29 11:26:44,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +23: [2023-04-29 11:26:44,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +51: [2023-04-29 11:26:44,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +51: [2023-04-29 11:26:44,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +41: [2023-04-29 11:26:44,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +14: [2023-04-29 11:26:44,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +14: [2023-04-29 11:26:44,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +41: [2023-04-29 11:26:44,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +14: [2023-04-29 11:26:44,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +32: [2023-04-29 11:26:44,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +14: [2023-04-29 11:26:44,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 2: [2023-04-29 11:26:44,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +50: [2023-04-29 11:26:44,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +54: [2023-04-29 11:26:44,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +50: [2023-04-29 11:26:44,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +29: [2023-04-29 11:26:44,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +36: [2023-04-29 11:26:44,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +41: [2023-04-29 11:26:44,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +32: [2023-04-29 11:26:44,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +36: [2023-04-29 11:26:44,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +50: [2023-04-29 11:26:44,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +23: [2023-04-29 11:26:44,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +13: [2023-04-29 11:26:44,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +13: [2023-04-29 11:26:44,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +50: [2023-04-29 11:26:44,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... + 1: [2023-04-29 11:26:44,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 2: [2023-04-29 11:26:44,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +36: [2023-04-29 11:26:44,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 3: [2023-04-29 11:26:44,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 6: [2023-04-29 11:26:44,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 6: [2023-04-29 11:26:44,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 6: [2023-04-29 11:26:44,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 6: [2023-04-29 11:26:44,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +50: [2023-04-29 11:26:44,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +36: [2023-04-29 11:26:44,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +36: [2023-04-29 11:26:44,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 3: [2023-04-29 11:26:44,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +32: [2023-04-29 11:26:44,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +43: [2023-04-29 11:26:44,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +63: [2023-04-29 11:26:44,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +63: [2023-04-29 11:26:44,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +22: [2023-04-29 11:26:44,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +22: [2023-04-29 11:26:44,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 1: [2023-04-29 11:26:44,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +63: [2023-04-29 11:26:44,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +36: [2023-04-29 11:26:44,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +63: [2023-04-29 11:26:44,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +54: [2023-04-29 11:26:44,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +13: [2023-04-29 11:26:44,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +43: [2023-04-29 11:26:44,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +29: [2023-04-29 11:26:44,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +42: [2023-04-29 11:26:44,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +43: [2023-04-29 11:26:44,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +43: [2023-04-29 11:26:44,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +63: [2023-04-29 11:26:44,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +62: [2023-04-29 11:26:44,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +22: [2023-04-29 11:26:44,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +63: [2023-04-29 11:26:44,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +63: [2023-04-29 11:26:44,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +22: [2023-04-29 11:26:44,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +54: [2023-04-29 11:26:44,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +29: [2023-04-29 11:26:44,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +29: [2023-04-29 11:26:44,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +54: [2023-04-29 11:26:44,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +54: [2023-04-29 11:26:44,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +39: [2023-04-29 11:26:44,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +54: [2023-04-29 11:26:44,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +54: [2023-04-29 11:26:44,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +39: [2023-04-29 11:26:44,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +42: [2023-04-29 11:26:44,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +21: [2023-04-29 11:26:44,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +63: [2023-04-29 11:26:44,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +55: [2023-04-29 11:26:44,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +53: [2023-04-29 11:26:44,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +53: [2023-04-29 11:26:44,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +53: [2023-04-29 11:26:44,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +53: [2023-04-29 11:26:44,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +53: [2023-04-29 11:26:44,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +53: [2023-04-29 11:26:44,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +53: [2023-04-29 11:26:44,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +21: [2023-04-29 11:26:44,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +13: [2023-04-29 11:26:44,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +53: [2023-04-29 11:26:44,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +21: [2023-04-29 11:26:44,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +21: [2023-04-29 11:26:44,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +39: [2023-04-29 11:26:44,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +55: [2023-04-29 11:26:44,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +55: [2023-04-29 11:26:44,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +54: [2023-04-29 11:26:44,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +62: [2023-04-29 11:26:44,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +39: [2023-04-29 11:26:44,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +14: [2023-04-29 11:26:44,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +62: [2023-04-29 11:26:44,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +62: [2023-04-29 11:26:44,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +39: [2023-04-29 11:26:44,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +39: [2023-04-29 11:26:44,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +39: [2023-04-29 11:26:44,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +14: [2023-04-29 11:26:44,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +53: [2023-04-29 11:26:44,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +39: [2023-04-29 11:26:44,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +53: [2023-04-29 11:26:44,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +14: [2023-04-29 11:26:44,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +53: [2023-04-29 11:26:44,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +53: [2023-04-29 11:26:44,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +55: [2023-04-29 11:26:44,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 11:26:44,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +42: [2023-04-29 11:26:44,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +42: [2023-04-29 11:26:44,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +29: [2023-04-29 11:26:44,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +14: [2023-04-29 11:26:44,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +53: [2023-04-29 11:26:44,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +55: [2023-04-29 11:26:44,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +53: [2023-04-29 11:26:44,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +53: [2023-04-29 11:26:44,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +53: [2023-04-29 11:26:44,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 11:26:44,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +51: [2023-04-29 11:26:44,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +39: [2023-04-29 11:26:44,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +39: [2023-04-29 11:26:44,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 11:26:44,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +51: [2023-04-29 11:26:44,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +23: [2023-04-29 11:26:44,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +55: [2023-04-29 11:26:44,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +32: [2023-04-29 11:26:44,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +32: [2023-04-29 11:26:44,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +32: [2023-04-29 11:26:44,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +32: [2023-04-29 11:26:44,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +39: [2023-04-29 11:26:44,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +39: [2023-04-29 11:26:44,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +13: [2023-04-29 11:26:44,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +60: [2023-04-29 11:26:44,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +60: [2023-04-29 11:26:44,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +23: [2023-04-29 11:26:44,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +23: [2023-04-29 11:26:44,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +39: [2023-04-29 11:26:44,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +39: [2023-04-29 11:26:44,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +42: [2023-04-29 11:26:44,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +42: [2023-04-29 11:26:44,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +55: [2023-04-29 11:26:44,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +55: [2023-04-29 11:26:44,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +42: [2023-04-29 11:26:44,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... + 1: [2023-04-29 11:26:44,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +43: [2023-04-29 11:26:44,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +23: [2023-04-29 11:26:44,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +22: [2023-04-29 11:26:44,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 6: [2023-04-29 11:26:44,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +60: [2023-04-29 11:26:44,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 6: [2023-04-29 11:26:44,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +55: [2023-04-29 11:26:44,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +55: [2023-04-29 11:26:44,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +60: [2023-04-29 11:26:44,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +60: [2023-04-29 11:26:44,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +60: [2023-04-29 11:26:44,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 6: [2023-04-29 11:26:44,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +13: [2023-04-29 11:26:44,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 3: [2023-04-29 11:26:44,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 8: [2023-04-29 11:26:44,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +43: [2023-04-29 11:26:44,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +56: [2023-04-29 11:26:44,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 3: [2023-04-29 11:26:44,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +47: [2023-04-29 11:26:44,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +47: [2023-04-29 11:26:44,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +60: [2023-04-29 11:26:44,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +60: [2023-04-29 11:26:44,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +60: [2023-04-29 11:26:44,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +60: [2023-04-29 11:26:44,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +60: [2023-04-29 11:26:44,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +60: [2023-04-29 11:26:44,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 8: [2023-04-29 11:26:44,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +39: [2023-04-29 11:26:44,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +29: [2023-04-29 11:26:44,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +39: [2023-04-29 11:26:44,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +48: [2023-04-29 11:26:44,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +48: [2023-04-29 11:26:44,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +48: [2023-04-29 11:26:44,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +48: [2023-04-29 11:26:44,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +60: [2023-04-29 11:26:44,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +40: [2023-04-29 11:26:44,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +40: [2023-04-29 11:26:44,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +40: [2023-04-29 11:26:44,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +61: [2023-04-29 11:26:44,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +27: [2023-04-29 11:26:44,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +27: [2023-04-29 11:26:44,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +55: [2023-04-29 11:26:44,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +27: [2023-04-29 11:26:44,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +56: [2023-04-29 11:26:44,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +27: [2023-04-29 11:26:44,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +43: [2023-04-29 11:26:44,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +22: [2023-04-29 11:26:44,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +43: [2023-04-29 11:26:44,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +54: [2023-04-29 11:26:44,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +55: [2023-04-29 11:26:44,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +60: [2023-04-29 11:26:44,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +17: [2023-04-29 11:26:44,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +17: [2023-04-29 11:26:44,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +40: [2023-04-29 11:26:44,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +56: [2023-04-29 11:26:44,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +60: [2023-04-29 11:26:44,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +17: [2023-04-29 11:26:44,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +54: [2023-04-29 11:26:44,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +61: [2023-04-29 11:26:44,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +17: [2023-04-29 11:26:44,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +37: [2023-04-29 11:26:44,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +21: [2023-04-29 11:26:44,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +47: [2023-04-29 11:26:44,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +47: [2023-04-29 11:26:44,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... + 3: [2023-04-29 11:26:44,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +37: [2023-04-29 11:26:44,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +47: [2023-04-29 11:26:44,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +24: [2023-04-29 11:26:44,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +61: [2023-04-29 11:26:44,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +61: [2023-04-29 11:26:44,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +40: [2023-04-29 11:26:44,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +40: [2023-04-29 11:26:44,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +40: [2023-04-29 11:26:44,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +24: [2023-04-29 11:26:44,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +56: [2023-04-29 11:26:44,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +54: [2023-04-29 11:26:44,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +63: [2023-04-29 11:26:44,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +54: [2023-04-29 11:26:44,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +29: [2023-04-29 11:26:44,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +40: [2023-04-29 11:26:44,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +37: [2023-04-29 11:26:44,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +22: [2023-04-29 11:26:44,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +56: [2023-04-29 11:26:44,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +60: [2023-04-29 11:26:44,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +47: [2023-04-29 11:26:44,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +29: [2023-04-29 11:26:44,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +37: [2023-04-29 11:26:44,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +56: [2023-04-29 11:26:44,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +21: [2023-04-29 11:26:44,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +21: [2023-04-29 11:26:44,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +37: [2023-04-29 11:26:44,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +21: [2023-04-29 11:26:44,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 3: [2023-04-29 11:26:44,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 3: [2023-04-29 11:26:44,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +22: [2023-04-29 11:26:44,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +47: [2023-04-29 11:26:44,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... + 8: [2023-04-29 11:26:44,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +24: [2023-04-29 11:26:44,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +24: [2023-04-29 11:26:44,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +37: [2023-04-29 11:26:44,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +63: [2023-04-29 11:26:44,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +51: [2023-04-29 11:26:44,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +63: [2023-04-29 11:26:44,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +63: [2023-04-29 11:26:44,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +51: [2023-04-29 11:26:44,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 11:26:44,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +56: [2023-04-29 11:26:44,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +51: [2023-04-29 11:26:44,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 3: [2023-04-29 11:26:44,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +47: [2023-04-29 11:26:44,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +37: [2023-04-29 11:26:44,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +56: [2023-04-29 11:26:44,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +43: [2023-04-29 11:26:44,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +43: [2023-04-29 11:26:44,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +43: [2023-04-29 11:26:44,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +43: [2023-04-29 11:26:44,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +37: [2023-04-29 11:26:44,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +63: [2023-04-29 11:26:44,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +22: [2023-04-29 11:26:44,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +63: [2023-04-29 11:26:44,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +63: [2023-04-29 11:26:44,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... + 8: [2023-04-29 11:26:44,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +36: [2023-04-29 11:26:44,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +23: [2023-04-29 11:26:44,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +26: [2023-04-29 11:26:44,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +26: [2023-04-29 11:26:44,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +48: [2023-04-29 11:26:44,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +26: [2023-04-29 11:26:44,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +26: [2023-04-29 11:26:44,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +26: [2023-04-29 11:26:44,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +26: [2023-04-29 11:26:44,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +26: [2023-04-29 11:26:44,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +23: [2023-04-29 11:26:44,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +32: [2023-04-29 11:26:44,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +26: [2023-04-29 11:26:44,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +32: [2023-04-29 11:26:44,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +23: [2023-04-29 11:26:44,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +63: [2023-04-29 11:26:44,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +61: [2023-04-29 11:26:44,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +27: [2023-04-29 11:26:44,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +36: [2023-04-29 11:26:44,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +36: [2023-04-29 11:26:44,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +34: [2023-04-29 11:26:44,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +34: [2023-04-29 11:26:44,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +48: [2023-04-29 11:26:44,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +48: [2023-04-29 11:26:44,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +34: [2023-04-29 11:26:44,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +32: [2023-04-29 11:26:44,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +32: [2023-04-29 11:26:44,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +26: [2023-04-29 11:26:44,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +17: [2023-04-29 11:26:44,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +23: [2023-04-29 11:26:44,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +45: [2023-04-29 11:26:44,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +26: [2023-04-29 11:26:44,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +17: [2023-04-29 11:26:44,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +45: [2023-04-29 11:26:44,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +26: [2023-04-29 11:26:44,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +26: [2023-04-29 11:26:44,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +27: [2023-04-29 11:26:44,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +61: [2023-04-29 11:26:44,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +27: [2023-04-29 11:26:44,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +27: [2023-04-29 11:26:44,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +36: [2023-04-29 11:26:44,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +34: [2023-04-29 11:26:44,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +45: [2023-04-29 11:26:44,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +48: [2023-04-29 11:26:44,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +45: [2023-04-29 11:26:44,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +19: [2023-04-29 11:26:44,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +19: [2023-04-29 11:26:44,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +24: [2023-04-29 11:26:44,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +24: [2023-04-29 11:26:44,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +17: [2023-04-29 11:26:44,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +22: [2023-04-29 11:26:44,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +16: [2023-04-29 11:26:44,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +16: [2023-04-29 11:26:44,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +16: [2023-04-29 11:26:44,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 2: [2023-04-29 11:26:44,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +59: [2023-04-29 11:26:44,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +59: [2023-04-29 11:26:44,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +59: [2023-04-29 11:26:44,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +17: [2023-04-29 11:26:44,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +59: [2023-04-29 11:26:44,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +36: [2023-04-29 11:26:44,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +36: [2023-04-29 11:26:44,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +19: [2023-04-29 11:26:44,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 11:26:44,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +34: [2023-04-29 11:26:44,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +16: [2023-04-29 11:26:44,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +19: [2023-04-29 11:26:44,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +61: [2023-04-29 11:26:44,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +26: [2023-04-29 11:26:44,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +26: [2023-04-29 11:26:44,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +26: [2023-04-29 11:26:44,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +34: [2023-04-29 11:26:44,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +61: [2023-04-29 11:26:44,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +53: [2023-04-29 11:26:44,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +34: [2023-04-29 11:26:44,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 2: [2023-04-29 11:26:44,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +63: [2023-04-29 11:26:44,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +19: [2023-04-29 11:26:44,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +19: [2023-04-29 11:26:44,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +36: [2023-04-29 11:26:44,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +45: [2023-04-29 11:26:44,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +19: [2023-04-29 11:26:44,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +34: [2023-04-29 11:26:44,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +19: [2023-04-29 11:26:44,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 2: [2023-04-29 11:26:44,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +44: [2023-04-29 11:26:44,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +44: [2023-04-29 11:26:44,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +45: [2023-04-29 11:26:44,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +24: [2023-04-29 11:26:44,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +24: [2023-04-29 11:26:44,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +39: [2023-04-29 11:26:44,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +45: [2023-04-29 11:26:44,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +63: [2023-04-29 11:26:44,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 11:26:44,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +35: [2023-04-29 11:26:44,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +35: [2023-04-29 11:26:44,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +35: [2023-04-29 11:26:44,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +44: [2023-04-29 11:26:44,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +45: [2023-04-29 11:26:44,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +44: [2023-04-29 11:26:44,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. + 2: [2023-04-29 11:26:44,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 2: [2023-04-29 11:26:44,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +39: [2023-04-29 11:26:44,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +43: [2023-04-29 11:26:44,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +43: [2023-04-29 11:26:44,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +43: [2023-04-29 11:26:44,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +22: [2023-04-29 11:26:44,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +22: [2023-04-29 11:26:44,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +36: [2023-04-29 11:26:44,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +22: [2023-04-29 11:26:44,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +45: [2023-04-29 11:26:44,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +55: [2023-04-29 11:26:44,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +55: [2023-04-29 11:26:44,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +45: [2023-04-29 11:26:44,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +45: [2023-04-29 11:26:44,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +43: [2023-04-29 11:26:44,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 8: [2023-04-29 11:26:44,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +53: [2023-04-29 11:26:44,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +22: [2023-04-29 11:26:44,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +49: [2023-04-29 11:26:44,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. + 5: [2023-04-29 11:26:44,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +49: [2023-04-29 11:26:44,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. +49: [2023-04-29 11:26:44,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. + 5: [2023-04-29 11:26:44,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 5: [2023-04-29 11:26:44,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +49: [2023-04-29 11:26:44,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_29-model_01-model_states.pt. + 5: [2023-04-29 11:26:44,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 5: [2023-04-29 11:26:44,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 5: [2023-04-29 11:26:44,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 5: [2023-04-29 11:26:44,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +45: [2023-04-29 11:26:44,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +22: [2023-04-29 11:26:44,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +22: [2023-04-29 11:26:44,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 6: [2023-04-29 11:26:44,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +31: [2023-04-29 11:26:44,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +31: [2023-04-29 11:26:44,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +31: [2023-04-29 11:26:44,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +31: [2023-04-29 11:26:44,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +31: [2023-04-29 11:26:44,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +39: [2023-04-29 11:26:44,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +31: [2023-04-29 11:26:44,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +31: [2023-04-29 11:26:44,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +31: [2023-04-29 11:26:44,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +55: [2023-04-29 11:26:44,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +25: [2023-04-29 11:26:44,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +25: [2023-04-29 11:26:44,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +25: [2023-04-29 11:26:44,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +25: [2023-04-29 11:26:44,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +25: [2023-04-29 11:26:44,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +25: [2023-04-29 11:26:44,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +25: [2023-04-29 11:26:44,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +25: [2023-04-29 11:26:44,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +53: [2023-04-29 11:26:44,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +53: [2023-04-29 11:26:44,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +58: [2023-04-29 11:26:44,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +58: [2023-04-29 11:26:44,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +58: [2023-04-29 11:26:44,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +58: [2023-04-29 11:26:44,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +55: [2023-04-29 11:26:44,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +54: [2023-04-29 11:26:44,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 6: [2023-04-29 11:26:44,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 5: [2023-04-29 11:26:44,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 5: [2023-04-29 11:26:44,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +31: [2023-04-29 11:26:44,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +31: [2023-04-29 11:26:44,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 5: [2023-04-29 11:26:44,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +31: [2023-04-29 11:26:44,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +25: [2023-04-29 11:26:44,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +31: [2023-04-29 11:26:44,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +52: [2023-04-29 11:26:44,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +52: [2023-04-29 11:26:44,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +52: [2023-04-29 11:26:44,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +52: [2023-04-29 11:26:44,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +52: [2023-04-29 11:26:44,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +52: [2023-04-29 11:26:44,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +52: [2023-04-29 11:26:44,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +31: [2023-04-29 11:26:44,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +52: [2023-04-29 11:26:44,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +25: [2023-04-29 11:26:44,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +31: [2023-04-29 11:26:44,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 5: [2023-04-29 11:26:44,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +31: [2023-04-29 11:26:44,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +25: [2023-04-29 11:26:44,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +31: [2023-04-29 11:26:44,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 6: [2023-04-29 11:26:44,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +63: [2023-04-29 11:26:44,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +54: [2023-04-29 11:26:44,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +63: [2023-04-29 11:26:44,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +25: [2023-04-29 11:26:44,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +25: [2023-04-29 11:26:44,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +25: [2023-04-29 11:26:44,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +25: [2023-04-29 11:26:44,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +25: [2023-04-29 11:26:44,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +45: [2023-04-29 11:26:44,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +39: [2023-04-29 11:26:44,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +59: [2023-04-29 11:26:44,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +45: [2023-04-29 11:26:44,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +59: [2023-04-29 11:26:44,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +60: [2023-04-29 11:26:44,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +52: [2023-04-29 11:26:44,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +52: [2023-04-29 11:26:44,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +52: [2023-04-29 11:26:44,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +52: [2023-04-29 11:26:44,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... + 6: [2023-04-29 11:26:44,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +52: [2023-04-29 11:26:44,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +52: [2023-04-29 11:26:44,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +52: [2023-04-29 11:26:44,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... + 3: [2023-04-29 11:26:44,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +45: [2023-04-29 11:26:44,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +63: [2023-04-29 11:26:44,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +54: [2023-04-29 11:26:44,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +52: [2023-04-29 11:26:44,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 11:26:44,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +16: [2023-04-29 11:26:44,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +53: [2023-04-29 11:26:44,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +16: [2023-04-29 11:26:44,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +59: [2023-04-29 11:26:44,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +28: [2023-04-29 11:26:44,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +28: [2023-04-29 11:26:44,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +28: [2023-04-29 11:26:44,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +28: [2023-04-29 11:26:44,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +11: [2023-04-29 11:26:44,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +45: [2023-04-29 11:26:44,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +22: [2023-04-29 11:26:44,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +11: [2023-04-29 11:26:44,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +11: [2023-04-29 11:26:44,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +11: [2023-04-29 11:26:44,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +22: [2023-04-29 11:26:44,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +54: [2023-04-29 11:26:44,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +55: [2023-04-29 11:26:44,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +16: [2023-04-29 11:26:44,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +16: [2023-04-29 11:26:44,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +44: [2023-04-29 11:26:44,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +44: [2023-04-29 11:26:44,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +44: [2023-04-29 11:26:44,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +35: [2023-04-29 11:26:44,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +39: [2023-04-29 11:26:44,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +28: [2023-04-29 11:26:44,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +28: [2023-04-29 11:26:44,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +28: [2023-04-29 11:26:44,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +35: [2023-04-29 11:26:44,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +29: [2023-04-29 11:26:44,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +29: [2023-04-29 11:26:44,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +29: [2023-04-29 11:26:44,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +29: [2023-04-29 11:26:44,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +39: [2023-04-29 11:26:44,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +63: [2023-04-29 11:26:44,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +44: [2023-04-29 11:26:44,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +33: [2023-04-29 11:26:44,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +33: [2023-04-29 11:26:44,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +33: [2023-04-29 11:26:44,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +21: [2023-04-29 11:26:44,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +60: [2023-04-29 11:26:44,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +33: [2023-04-29 11:26:44,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +33: [2023-04-29 11:26:44,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +33: [2023-04-29 11:26:44,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +33: [2023-04-29 11:26:44,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +33: [2023-04-29 11:26:44,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +51: [2023-04-29 11:26:44,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +28: [2023-04-29 11:26:44,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +22: [2023-04-29 11:26:44,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +35: [2023-04-29 11:26:44,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +35: [2023-04-29 11:26:44,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 4: [2023-04-29 11:26:44,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 4: [2023-04-29 11:26:44,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. + 4: [2023-04-29 11:26:44,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +55: [2023-04-29 11:26:44,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +49: [2023-04-29 11:26:44,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 3: [2023-04-29 11:26:44,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +60: [2023-04-29 11:26:44,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +33: [2023-04-29 11:26:44,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +54: [2023-04-29 11:26:44,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +49: [2023-04-29 11:26:44,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +49: [2023-04-29 11:26:44,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +60: [2023-04-29 11:26:44,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +22: [2023-04-29 11:26:44,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +33: [2023-04-29 11:26:44,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +39: [2023-04-29 11:26:44,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +33: [2023-04-29 11:26:44,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +53: [2023-04-29 11:26:44,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +21: [2023-04-29 11:26:44,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +54: [2023-04-29 11:26:44,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +30: [2023-04-29 11:26:44,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +30: [2023-04-29 11:26:44,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +30: [2023-04-29 11:26:44,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +33: [2023-04-29 11:26:44,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +30: [2023-04-29 11:26:44,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +33: [2023-04-29 11:26:44,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 11:26:44,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... + 3: [2023-04-29 11:26:44,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +37: [2023-04-29 11:26:44,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +37: [2023-04-29 11:26:44,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +37: [2023-04-29 11:26:44,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +37: [2023-04-29 11:26:44,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +51: [2023-04-29 11:26:44,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +49: [2023-04-29 11:26:44,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt... +33: [2023-04-29 11:26:44,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +55: [2023-04-29 11:26:44,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +33: [2023-04-29 11:26:44,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +33: [2023-04-29 11:26:44,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +21: [2023-04-29 11:26:44,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +28: [2023-04-29 11:26:44,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +28: [2023-04-29 11:26:44,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +28: [2023-04-29 11:26:44,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +28: [2023-04-29 11:26:44,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +55: [2023-04-29 11:26:44,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +55: [2023-04-29 11:26:44,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +53: [2023-04-29 11:26:44,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +21: [2023-04-29 11:26:44,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +51: [2023-04-29 11:26:44,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +55: [2023-04-29 11:26:44,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +58: [2023-04-29 11:26:44,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 3: [2023-04-29 11:26:44,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +58: [2023-04-29 11:26:44,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +54: [2023-04-29 11:26:44,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +30: [2023-04-29 11:26:44,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 11:26:44,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 11:26:44,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +53: [2023-04-29 11:26:44,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +54: [2023-04-29 11:26:44,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +21: [2023-04-29 11:26:44,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +37: [2023-04-29 11:26:44,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +37: [2023-04-29 11:26:44,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +37: [2023-04-29 11:26:44,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +37: [2023-04-29 11:26:44,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +30: [2023-04-29 11:26:44,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +55: [2023-04-29 11:26:44,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +51: [2023-04-29 11:26:44,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +58: [2023-04-29 11:26:44,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +58: [2023-04-29 11:26:44,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +17: [2023-04-29 11:26:44,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +26: [2023-04-29 11:26:44,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +39: [2023-04-29 11:26:44,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +11: [2023-04-29 11:26:44,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +51: [2023-04-29 11:26:44,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +14: [2023-04-29 11:26:44,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +27: [2023-04-29 11:26:44,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +14: [2023-04-29 11:26:44,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +13: [2023-04-29 11:26:44,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +21: [2023-04-29 11:26:44,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +14: [2023-04-29 11:26:44,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +14: [2023-04-29 11:26:44,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +13: [2023-04-29 11:26:44,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +13: [2023-04-29 11:26:44,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +60: [2023-04-29 11:26:44,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +51: [2023-04-29 11:26:44,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +14: [2023-04-29 11:26:44,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +14: [2023-04-29 11:26:44,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +14: [2023-04-29 11:26:44,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +63: [2023-04-29 11:26:44,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +14: [2023-04-29 11:26:44,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +13: [2023-04-29 11:26:44,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_07-model_01-model_states.pt. +30: [2023-04-29 11:26:44,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +63: [2023-04-29 11:26:44,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +17: [2023-04-29 11:26:44,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +21: [2023-04-29 11:26:44,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +30: [2023-04-29 11:26:44,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +30: [2023-04-29 11:26:44,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +55: [2023-04-29 11:26:44,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +21: [2023-04-29 11:26:44,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +30: [2023-04-29 11:26:44,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +17: [2023-04-29 11:26:44,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +14: [2023-04-29 11:26:44,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +27: [2023-04-29 11:26:44,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +27: [2023-04-29 11:26:44,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +27: [2023-04-29 11:26:44,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +14: [2023-04-29 11:26:44,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +14: [2023-04-29 11:26:44,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +51: [2023-04-29 11:26:44,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +55: [2023-04-29 11:26:44,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... + 3: [2023-04-29 11:26:44,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +17: [2023-04-29 11:26:44,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 9: [2023-04-29 11:26:44,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 9: [2023-04-29 11:26:44,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 9: [2023-04-29 11:26:44,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 9: [2023-04-29 11:26:44,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +17: [2023-04-29 11:26:44,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +26: [2023-04-29 11:26:44,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +55: [2023-04-29 11:26:44,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +17: [2023-04-29 11:26:44,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +29: [2023-04-29 11:26:44,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +29: [2023-04-29 11:26:44,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +27: [2023-04-29 11:26:44,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +29: [2023-04-29 11:26:44,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +34: [2023-04-29 11:26:44,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +27: [2023-04-29 11:26:44,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +11: [2023-04-29 11:26:44,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +26: [2023-04-29 11:26:44,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +26: [2023-04-29 11:26:44,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +27: [2023-04-29 11:26:44,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 4: [2023-04-29 11:26:44,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +14: [2023-04-29 11:26:44,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +14: [2023-04-29 11:26:44,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 4: [2023-04-29 11:26:44,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +14: [2023-04-29 11:26:44,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +21: [2023-04-29 11:26:44,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +14: [2023-04-29 11:26:44,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +14: [2023-04-29 11:26:44,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +43: [2023-04-29 11:26:44,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +21: [2023-04-29 11:26:44,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +21: [2023-04-29 11:26:44,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +29: [2023-04-29 11:26:44,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 4: [2023-04-29 11:26:44,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +21: [2023-04-29 11:26:44,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +17: [2023-04-29 11:26:44,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +43: [2023-04-29 11:26:44,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +17: [2023-04-29 11:26:44,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 3: [2023-04-29 11:26:44,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +30: [2023-04-29 11:26:44,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +25: [2023-04-29 11:26:44,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +11: [2023-04-29 11:26:44,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +30: [2023-04-29 11:26:44,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +30: [2023-04-29 11:26:44,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +60: [2023-04-29 11:26:44,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +30: [2023-04-29 11:26:44,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +19: [2023-04-29 11:26:44,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +19: [2023-04-29 11:26:44,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +27: [2023-04-29 11:26:44,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +11: [2023-04-29 11:26:44,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +43: [2023-04-29 11:26:44,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +21: [2023-04-29 11:26:44,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +34: [2023-04-29 11:26:44,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +21: [2023-04-29 11:26:44,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +19: [2023-04-29 11:26:44,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +43: [2023-04-29 11:26:44,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +21: [2023-04-29 11:26:44,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +21: [2023-04-29 11:26:44,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +60: [2023-04-29 11:26:44,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +60: [2023-04-29 11:26:44,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +19: [2023-04-29 11:26:44,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +55: [2023-04-29 11:26:44,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +31: [2023-04-29 11:26:44,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +28: [2023-04-29 11:26:44,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +26: [2023-04-29 11:26:44,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +34: [2023-04-29 11:26:44,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +28: [2023-04-29 11:26:44,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +28: [2023-04-29 11:26:44,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +28: [2023-04-29 11:26:44,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +43: [2023-04-29 11:26:44,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +13: [2023-04-29 11:26:44,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +13: [2023-04-29 11:26:44,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +13: [2023-04-29 11:26:44,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +45: [2023-04-29 11:26:44,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +25: [2023-04-29 11:26:44,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +34: [2023-04-29 11:26:44,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +45: [2023-04-29 11:26:44,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +13: [2023-04-29 11:26:44,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 5: [2023-04-29 11:26:44,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +43: [2023-04-29 11:26:44,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +43: [2023-04-29 11:26:44,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +45: [2023-04-29 11:26:44,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +25: [2023-04-29 11:26:44,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +25: [2023-04-29 11:26:44,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +45: [2023-04-29 11:26:44,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +31: [2023-04-29 11:26:44,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +31: [2023-04-29 11:26:44,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +31: [2023-04-29 11:26:44,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 5: [2023-04-29 11:26:44,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 5: [2023-04-29 11:26:44,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +34: [2023-04-29 11:26:44,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +26: [2023-04-29 11:26:44,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +45: [2023-04-29 11:26:44,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +33: [2023-04-29 11:26:44,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +43: [2023-04-29 11:26:44,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +52: [2023-04-29 11:26:44,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +25: [2023-04-29 11:26:44,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +55: [2023-04-29 11:26:44,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +52: [2023-04-29 11:26:44,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +26: [2023-04-29 11:26:44,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +26: [2023-04-29 11:26:44,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +16: [2023-04-29 11:26:44,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +16: [2023-04-29 11:26:44,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +18: [2023-04-29 11:26:44,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +18: [2023-04-29 11:26:44,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +18: [2023-04-29 11:26:44,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +18: [2023-04-29 11:26:44,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +19: [2023-04-29 11:26:44,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +19: [2023-04-29 11:26:44,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +47: [2023-04-29 11:26:44,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +47: [2023-04-29 11:26:44,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +52: [2023-04-29 11:26:44,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +52: [2023-04-29 11:26:44,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +44: [2023-04-29 11:26:44,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +44: [2023-04-29 11:26:44,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +45: [2023-04-29 11:26:44,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +19: [2023-04-29 11:26:44,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +44: [2023-04-29 11:26:44,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +16: [2023-04-29 11:26:44,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +50: [2023-04-29 11:26:44,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +50: [2023-04-29 11:26:44,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +50: [2023-04-29 11:26:44,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +50: [2023-04-29 11:26:44,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +31: [2023-04-29 11:26:44,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +47: [2023-04-29 11:26:44,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +47: [2023-04-29 11:26:44,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +16: [2023-04-29 11:26:44,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +19: [2023-04-29 11:26:44,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +49: [2023-04-29 11:26:44,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +44: [2023-04-29 11:26:44,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +16: [2023-04-29 11:26:44,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +16: [2023-04-29 11:26:44,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +16: [2023-04-29 11:26:44,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +47: [2023-04-29 11:26:44,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +47: [2023-04-29 11:26:44,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +34: [2023-04-29 11:26:44,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +45: [2023-04-29 11:26:44,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +47: [2023-04-29 11:26:44,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +33: [2023-04-29 11:26:44,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +15: [2023-04-29 11:26:44,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +15: [2023-04-29 11:26:44,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +15: [2023-04-29 11:26:44,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +28: [2023-04-29 11:26:44,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +15: [2023-04-29 11:26:44,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +28: [2023-04-29 11:26:44,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +44: [2023-04-29 11:26:44,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +44: [2023-04-29 11:26:44,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +44: [2023-04-29 11:26:44,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +45: [2023-04-29 11:26:44,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +49: [2023-04-29 11:26:44,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +16: [2023-04-29 11:26:44,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +47: [2023-04-29 11:26:44,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +50: [2023-04-29 11:26:44,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +50: [2023-04-29 11:26:44,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +45: [2023-04-29 11:26:44,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +44: [2023-04-29 11:26:44,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +50: [2023-04-29 11:26:44,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +49: [2023-04-29 11:26:44,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +49: [2023-04-29 11:26:44,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. + 5: [2023-04-29 11:26:44,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +49: [2023-04-29 11:26:44,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +45: [2023-04-29 11:26:44,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +50: [2023-04-29 11:26:44,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +25: [2023-04-29 11:26:44,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +28: [2023-04-29 11:26:44,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +34: [2023-04-29 11:26:44,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +37: [2023-04-29 11:26:44,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +45: [2023-04-29 11:26:44,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +57: [2023-04-29 11:26:44,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +57: [2023-04-29 11:26:44,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +57: [2023-04-29 11:26:44,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +57: [2023-04-29 11:26:44,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +25: [2023-04-29 11:26:44,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +33: [2023-04-29 11:26:44,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +33: [2023-04-29 11:26:44,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +33: [2023-04-29 11:26:44,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +34: [2023-04-29 11:26:44,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +31: [2023-04-29 11:26:44,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +25: [2023-04-29 11:26:44,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +49: [2023-04-29 11:26:44,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +31: [2023-04-29 11:26:44,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +49: [2023-04-29 11:26:44,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +49: [2023-04-29 11:26:44,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +46: [2023-04-29 11:26:44,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +46: [2023-04-29 11:26:44,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +45: [2023-04-29 11:26:44,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +37: [2023-04-29 11:26:44,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +37: [2023-04-29 11:26:44,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +37: [2023-04-29 11:26:44,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +11: [2023-04-29 11:26:44,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +31: [2023-04-29 11:26:44,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +20: [2023-04-29 11:26:44,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +20: [2023-04-29 11:26:44,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +52: [2023-04-29 11:26:44,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +52: [2023-04-29 11:26:44,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +45: [2023-04-29 11:26:44,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_00-model_states.pt. +46: [2023-04-29 11:26:44,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +45: [2023-04-29 11:26:44,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +46: [2023-04-29 11:26:44,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +45: [2023-04-29 11:26:44,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +20: [2023-04-29 11:26:44,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +20: [2023-04-29 11:26:44,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +41: [2023-04-29 11:26:44,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +41: [2023-04-29 11:26:44,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +20: [2023-04-29 11:26:44,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +20: [2023-04-29 11:26:44,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +20: [2023-04-29 11:26:44,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +20: [2023-04-29 11:26:44,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 5: [2023-04-29 11:26:44,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +11: [2023-04-29 11:26:44,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +18: [2023-04-29 11:26:44,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +18: [2023-04-29 11:26:44,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +41: [2023-04-29 11:26:44,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +41: [2023-04-29 11:26:44,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +41: [2023-04-29 11:26:44,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +41: [2023-04-29 11:26:44,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +41: [2023-04-29 11:26:44,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +41: [2023-04-29 11:26:44,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +18: [2023-04-29 11:26:44,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +18: [2023-04-29 11:26:44,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +20: [2023-04-29 11:26:44,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +20: [2023-04-29 11:26:44,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +30: [2023-04-29 11:26:44,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +30: [2023-04-29 11:26:44,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +20: [2023-04-29 11:26:44,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +20: [2023-04-29 11:26:44,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... + 4: [2023-04-29 11:26:44,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +52: [2023-04-29 11:26:44,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +20: [2023-04-29 11:26:44,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +20: [2023-04-29 11:26:44,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +41: [2023-04-29 11:26:44,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +29: [2023-04-29 11:26:44,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +52: [2023-04-29 11:26:44,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +45: [2023-04-29 11:26:44,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt... +41: [2023-04-29 11:26:44,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +20: [2023-04-29 11:26:44,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt... +41: [2023-04-29 11:26:44,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +21: [2023-04-29 11:26:44,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 11:26:44,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +41: [2023-04-29 11:26:44,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 2: [2023-04-29 11:26:44,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +20: [2023-04-29 11:26:44,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +30: [2023-04-29 11:26:44,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +41: [2023-04-29 11:26:44,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +29: [2023-04-29 11:26:44,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +41: [2023-04-29 11:26:44,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +29: [2023-04-29 11:26:44,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +15: [2023-04-29 11:26:44,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +29: [2023-04-29 11:26:44,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +41: [2023-04-29 11:26:44,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 4: [2023-04-29 11:26:44,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +28: [2023-04-29 11:26:44,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +29: [2023-04-29 11:26:44,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +41: [2023-04-29 11:26:44,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... + 2: [2023-04-29 11:26:44,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +33: [2023-04-29 11:26:44,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 4: [2023-04-29 11:26:44,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +30: [2023-04-29 11:26:44,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +30: [2023-04-29 11:26:44,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 11:26:44,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 11:26:44,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 2: [2023-04-29 11:26:44,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +28: [2023-04-29 11:26:44,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +14: [2023-04-29 11:26:44,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +15: [2023-04-29 11:26:44,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +15: [2023-04-29 11:26:44,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +57: [2023-04-29 11:26:44,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 2: [2023-04-29 11:26:44,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +29: [2023-04-29 11:26:44,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +15: [2023-04-29 11:26:44,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +29: [2023-04-29 11:26:44,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +14: [2023-04-29 11:26:44,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +14: [2023-04-29 11:26:44,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +14: [2023-04-29 11:26:44,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +44: [2023-04-29 11:26:44,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +44: [2023-04-29 11:26:44,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +44: [2023-04-29 11:26:44,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +44: [2023-04-29 11:26:44,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +28: [2023-04-29 11:26:44,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +21: [2023-04-29 11:26:44,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +21: [2023-04-29 11:26:44,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +21: [2023-04-29 11:26:44,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 11:26:44,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +13: [2023-04-29 11:26:44,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +29: [2023-04-29 11:26:44,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 4: [2023-04-29 11:26:44,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +11: [2023-04-29 11:26:44,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +11: [2023-04-29 11:26:44,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +11: [2023-04-29 11:26:44,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +57: [2023-04-29 11:26:44,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +33: [2023-04-29 11:26:44,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +33: [2023-04-29 11:26:44,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 4: [2023-04-29 11:26:44,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +57: [2023-04-29 11:26:44,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +57: [2023-04-29 11:26:44,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +37: [2023-04-29 11:26:44,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +30: [2023-04-29 11:26:44,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +44: [2023-04-29 11:26:44,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +44: [2023-04-29 11:26:44,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +44: [2023-04-29 11:26:44,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +13: [2023-04-29 11:26:44,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +44: [2023-04-29 11:26:44,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +46: [2023-04-29 11:26:44,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +46: [2023-04-29 11:26:44,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +46: [2023-04-29 11:26:44,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +38: [2023-04-29 11:26:44,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +38: [2023-04-29 11:26:44,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +46: [2023-04-29 11:26:44,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +38: [2023-04-29 11:26:44,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +38: [2023-04-29 11:26:44,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +13: [2023-04-29 11:26:44,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +38: [2023-04-29 11:26:44,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +38: [2023-04-29 11:26:44,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +11: [2023-04-29 11:26:44,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +11: [2023-04-29 11:26:44,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +30: [2023-04-29 11:26:44,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +37: [2023-04-29 11:26:44,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +28: [2023-04-29 11:26:44,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +11: [2023-04-29 11:26:44,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +38: [2023-04-29 11:26:44,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +37: [2023-04-29 11:26:44,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +38: [2023-04-29 11:26:44,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +37: [2023-04-29 11:26:44,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +13: [2023-04-29 11:26:44,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +13: [2023-04-29 11:26:44,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +13: [2023-04-29 11:26:44,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +21: [2023-04-29 11:26:44,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 11:26:44,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +38: [2023-04-29 11:26:44,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +28: [2023-04-29 11:26:44,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +38: [2023-04-29 11:26:44,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +28: [2023-04-29 11:26:44,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 9: [2023-04-29 11:26:44,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +38: [2023-04-29 11:26:44,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +38: [2023-04-29 11:26:44,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +28: [2023-04-29 11:26:44,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +13: [2023-04-29 11:26:44,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +13: [2023-04-29 11:26:44,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +28: [2023-04-29 11:26:44,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +28: [2023-04-29 11:26:44,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +47: [2023-04-29 11:26:44,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 4: [2023-04-29 11:26:44,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 4: [2023-04-29 11:26:44,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 4: [2023-04-29 11:26:44,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +28: [2023-04-29 11:26:44,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +30: [2023-04-29 11:26:44,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 11:26:44,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +21: [2023-04-29 11:26:44,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 11:26:44,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +21: [2023-04-29 11:26:44,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 11:26:44,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +21: [2023-04-29 11:26:44,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 6: [2023-04-29 11:26:44,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 6: [2023-04-29 11:26:44,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 6: [2023-04-29 11:26:44,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 11:26:44,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +47: [2023-04-29 11:26:44,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +14: [2023-04-29 11:26:44,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 11:26:44,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... +14: [2023-04-29 11:26:44,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +14: [2023-04-29 11:26:44,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +14: [2023-04-29 11:26:44,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +28: [2023-04-29 11:26:44,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt... + 9: [2023-04-29 11:26:44,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +19: [2023-04-29 11:26:44,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +19: [2023-04-29 11:26:44,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +38: [2023-04-29 11:26:44,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +19: [2023-04-29 11:26:44,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +20: [2023-04-29 11:26:44,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +19: [2023-04-29 11:26:44,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +50: [2023-04-29 11:26:44,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +38: [2023-04-29 11:26:44,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +38: [2023-04-29 11:26:44,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +38: [2023-04-29 11:26:44,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +47: [2023-04-29 11:26:44,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +47: [2023-04-29 11:26:44,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +50: [2023-04-29 11:26:44,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +50: [2023-04-29 11:26:44,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +50: [2023-04-29 11:26:44,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +47: [2023-04-29 11:26:44,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +48: [2023-04-29 11:26:44,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +48: [2023-04-29 11:26:44,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 0: [2023-04-29 11:26:44,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 0: [2023-04-29 11:26:44,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +48: [2023-04-29 11:26:44,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +48: [2023-04-29 11:26:44,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +48: [2023-04-29 11:26:44,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +48: [2023-04-29 11:26:44,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +48: [2023-04-29 11:26:44,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +48: [2023-04-29 11:26:44,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 0: [2023-04-29 11:26:44,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 0: [2023-04-29 11:26:44,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +20: [2023-04-29 11:26:44,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +48: [2023-04-29 11:26:44,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +41: [2023-04-29 11:26:44,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +41: [2023-04-29 11:26:44,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +48: [2023-04-29 11:26:44,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +48: [2023-04-29 11:26:44,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +48: [2023-04-29 11:26:44,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +48: [2023-04-29 11:26:44,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +20: [2023-04-29 11:26:44,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +48: [2023-04-29 11:26:44,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +48: [2023-04-29 11:26:44,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +48: [2023-04-29 11:26:44,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +20: [2023-04-29 11:26:44,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_00-model_states.pt. +41: [2023-04-29 11:26:44,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +41: [2023-04-29 11:26:44,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +47: [2023-04-29 11:26:44,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +20: [2023-04-29 11:26:44,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +40: [2023-04-29 11:26:44,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +40: [2023-04-29 11:26:44,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +40: [2023-04-29 11:26:44,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +40: [2023-04-29 11:26:44,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +50: [2023-04-29 11:26:44,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +50: [2023-04-29 11:26:44,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +50: [2023-04-29 11:26:44,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. + 2: [2023-04-29 11:26:44,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +19: [2023-04-29 11:26:44,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 2: [2023-04-29 11:26:44,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +19: [2023-04-29 11:26:44,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +19: [2023-04-29 11:26:44,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +19: [2023-04-29 11:26:44,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +50: [2023-04-29 11:26:44,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +10: [2023-04-29 11:26:44,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +10: [2023-04-29 11:26:44,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +10: [2023-04-29 11:26:44,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +40: [2023-04-29 11:26:44,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +10: [2023-04-29 11:26:44,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +44: [2023-04-29 11:26:44,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +40: [2023-04-29 11:26:44,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +40: [2023-04-29 11:26:44,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +40: [2023-04-29 11:26:44,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +47: [2023-04-29 11:26:44,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +47: [2023-04-29 11:26:44,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +50: [2023-04-29 11:26:44,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +44: [2023-04-29 11:26:44,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +44: [2023-04-29 11:26:44,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +44: [2023-04-29 11:26:44,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +20: [2023-04-29 11:26:44,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 0: [2023-04-29 11:26:44,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +58: [2023-04-29 11:26:44,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +58: [2023-04-29 11:26:44,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +58: [2023-04-29 11:26:44,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +58: [2023-04-29 11:26:44,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +58: [2023-04-29 11:26:44,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +58: [2023-04-29 11:26:44,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +58: [2023-04-29 11:26:44,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 0: [2023-04-29 11:26:44,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +58: [2023-04-29 11:26:44,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 0: [2023-04-29 11:26:44,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 0: [2023-04-29 11:26:44,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 7: [2023-04-29 11:26:44,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 7: [2023-04-29 11:26:44,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 7: [2023-04-29 11:26:44,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +50: [2023-04-29 11:26:44,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 7: [2023-04-29 11:26:44,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 2: [2023-04-29 11:26:44,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 4: [2023-04-29 11:26:44,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +50: [2023-04-29 11:26:44,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +50: [2023-04-29 11:26:44,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +41: [2023-04-29 11:26:44,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +34: [2023-04-29 11:26:44,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +34: [2023-04-29 11:26:44,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +41: [2023-04-29 11:26:44,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +34: [2023-04-29 11:26:44,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +34: [2023-04-29 11:26:44,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +58: [2023-04-29 11:26:44,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +58: [2023-04-29 11:26:44,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +58: [2023-04-29 11:26:44,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +58: [2023-04-29 11:26:44,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +58: [2023-04-29 11:26:44,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +58: [2023-04-29 11:26:44,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +58: [2023-04-29 11:26:44,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +58: [2023-04-29 11:26:44,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +41: [2023-04-29 11:26:44,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +20: [2023-04-29 11:26:44,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +20: [2023-04-29 11:26:44,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +38: [2023-04-29 11:26:44,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +41: [2023-04-29 11:26:44,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +42: [2023-04-29 11:26:44,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +42: [2023-04-29 11:26:44,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +42: [2023-04-29 11:26:44,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +42: [2023-04-29 11:26:44,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +50: [2023-04-29 11:26:44,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 4: [2023-04-29 11:26:44,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +38: [2023-04-29 11:26:44,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 2: [2023-04-29 11:26:44,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +10: [2023-04-29 11:26:44,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +10: [2023-04-29 11:26:44,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +10: [2023-04-29 11:26:44,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +50: [2023-04-29 11:26:44,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +10: [2023-04-29 11:26:44,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 6: [2023-04-29 11:26:44,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 6: [2023-04-29 11:26:44,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +50: [2023-04-29 11:26:44,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +50: [2023-04-29 11:26:44,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +10: [2023-04-29 11:26:44,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +44: [2023-04-29 11:26:44,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +44: [2023-04-29 11:26:44,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 6: [2023-04-29 11:26:44,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +10: [2023-04-29 11:26:44,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +10: [2023-04-29 11:26:44,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 4: [2023-04-29 11:26:44,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +10: [2023-04-29 11:26:44,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +38: [2023-04-29 11:26:44,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +38: [2023-04-29 11:26:44,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +44: [2023-04-29 11:26:44,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 7: [2023-04-29 11:26:44,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +11: [2023-04-29 11:26:44,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +10: [2023-04-29 11:26:44,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +11: [2023-04-29 11:26:44,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +11: [2023-04-29 11:26:44,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +11: [2023-04-29 11:26:44,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 7: [2023-04-29 11:26:44,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 7: [2023-04-29 11:26:44,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +10: [2023-04-29 11:26:44,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +12: [2023-04-29 11:26:44,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +10: [2023-04-29 11:26:44,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +12: [2023-04-29 11:26:44,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 7: [2023-04-29 11:26:44,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +10: [2023-04-29 11:26:44,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +34: [2023-04-29 11:26:44,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +36: [2023-04-29 11:26:44,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +36: [2023-04-29 11:26:44,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +36: [2023-04-29 11:26:44,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +36: [2023-04-29 11:26:44,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +44: [2023-04-29 11:26:44,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 8: [2023-04-29 11:26:44,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 8: [2023-04-29 11:26:44,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 8: [2023-04-29 11:26:44,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 8: [2023-04-29 11:26:44,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +11: [2023-04-29 11:26:44,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +12: [2023-04-29 11:26:44,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +12: [2023-04-29 11:26:44,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +38: [2023-04-29 11:26:44,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +34: [2023-04-29 11:26:44,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +35: [2023-04-29 11:26:44,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 11:26:44,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +11: [2023-04-29 11:26:44,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +11: [2023-04-29 11:26:44,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +38: [2023-04-29 11:26:44,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +11: [2023-04-29 11:26:44,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +35: [2023-04-29 11:26:44,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 11:26:44,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 11:26:44,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 11:26:44,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 11:26:44,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 11:26:44,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +34: [2023-04-29 11:26:44,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +61: [2023-04-29 11:26:44,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +61: [2023-04-29 11:26:44,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +61: [2023-04-29 11:26:44,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +47: [2023-04-29 11:26:44,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +47: [2023-04-29 11:26:44,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +61: [2023-04-29 11:26:44,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +37: [2023-04-29 11:26:44,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +37: [2023-04-29 11:26:44,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +38: [2023-04-29 11:26:44,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +34: [2023-04-29 11:26:44,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +37: [2023-04-29 11:26:44,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +37: [2023-04-29 11:26:44,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +35: [2023-04-29 11:26:44,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... + 4: [2023-04-29 11:26:44,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +42: [2023-04-29 11:26:44,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 11:26:44,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 11:26:44,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 11:26:44,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +47: [2023-04-29 11:26:44,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +35: [2023-04-29 11:26:44,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +47: [2023-04-29 11:26:44,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +48: [2023-04-29 11:26:44,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +48: [2023-04-29 11:26:44,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +38: [2023-04-29 11:26:44,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 11:26:44,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +35: [2023-04-29 11:26:44,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +35: [2023-04-29 11:26:44,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +38: [2023-04-29 11:26:44,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 11:26:44,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +35: [2023-04-29 11:26:44,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +38: [2023-04-29 11:26:44,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +35: [2023-04-29 11:26:44,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +38: [2023-04-29 11:26:44,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... + 4: [2023-04-29 11:26:44,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +48: [2023-04-29 11:26:44,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 6: [2023-04-29 11:26:44,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +48: [2023-04-29 11:26:44,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +38: [2023-04-29 11:26:44,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +19: [2023-04-29 11:26:44,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +19: [2023-04-29 11:26:44,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +36: [2023-04-29 11:26:44,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +36: [2023-04-29 11:26:44,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +40: [2023-04-29 11:26:44,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +19: [2023-04-29 11:26:44,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +19: [2023-04-29 11:26:44,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +19: [2023-04-29 11:26:44,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +38: [2023-04-29 11:26:44,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +38: [2023-04-29 11:26:44,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +49: [2023-04-29 11:26:44,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +49: [2023-04-29 11:26:44,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +12: [2023-04-29 11:26:44,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +12: [2023-04-29 11:26:44,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +12: [2023-04-29 11:26:44,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +38: [2023-04-29 11:26:44,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +12: [2023-04-29 11:26:44,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +36: [2023-04-29 11:26:44,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +36: [2023-04-29 11:26:44,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 11:26:44,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +42: [2023-04-29 11:26:44,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +32: [2023-04-29 11:26:44,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +32: [2023-04-29 11:26:44,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +40: [2023-04-29 11:26:44,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +32: [2023-04-29 11:26:44,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +42: [2023-04-29 11:26:44,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +32: [2023-04-29 11:26:44,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +49: [2023-04-29 11:26:44,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +49: [2023-04-29 11:26:44,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +42: [2023-04-29 11:26:44,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +19: [2023-04-29 11:26:44,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +19: [2023-04-29 11:26:44,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +19: [2023-04-29 11:26:44,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +49: [2023-04-29 11:26:44,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 8: [2023-04-29 11:26:44,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +38: [2023-04-29 11:26:44,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... + 8: [2023-04-29 11:26:44,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 8: [2023-04-29 11:26:44,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +61: [2023-04-29 11:26:44,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +61: [2023-04-29 11:26:44,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +49: [2023-04-29 11:26:44,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +40: [2023-04-29 11:26:44,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +61: [2023-04-29 11:26:44,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +40: [2023-04-29 11:26:44,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +47: [2023-04-29 11:26:44,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +61: [2023-04-29 11:26:44,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +49: [2023-04-29 11:26:44,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 11:26:44,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 11:26:44,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +47: [2023-04-29 11:26:44,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 11:26:44,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +48: [2023-04-29 11:26:44,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +47: [2023-04-29 11:26:44,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +49: [2023-04-29 11:26:44,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 11:26:44,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +37: [2023-04-29 11:26:44,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +48: [2023-04-29 11:26:44,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +47: [2023-04-29 11:26:44,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +37: [2023-04-29 11:26:44,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +37: [2023-04-29 11:26:44,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +50: [2023-04-29 11:26:44,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +37: [2023-04-29 11:26:44,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +58: [2023-04-29 11:26:44,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +58: [2023-04-29 11:26:44,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +58: [2023-04-29 11:26:44,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +50: [2023-04-29 11:26:44,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +50: [2023-04-29 11:26:44,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +58: [2023-04-29 11:26:44,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +39: [2023-04-29 11:26:44,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +39: [2023-04-29 11:26:44,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +39: [2023-04-29 11:26:44,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +40: [2023-04-29 11:26:44,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +39: [2023-04-29 11:26:44,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +48: [2023-04-29 11:26:44,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +48: [2023-04-29 11:26:44,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +56: [2023-04-29 11:26:44,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +56: [2023-04-29 11:26:44,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +50: [2023-04-29 11:26:44,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +10: [2023-04-29 11:26:44,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +40: [2023-04-29 11:26:44,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +56: [2023-04-29 11:26:44,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +32: [2023-04-29 11:26:44,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +56: [2023-04-29 11:26:44,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +50: [2023-04-29 11:26:44,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +34: [2023-04-29 11:26:44,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +32: [2023-04-29 11:26:44,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +10: [2023-04-29 11:26:44,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +10: [2023-04-29 11:26:44,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +57: [2023-04-29 11:26:44,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 11:26:44,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +46: [2023-04-29 11:26:44,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +46: [2023-04-29 11:26:44,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +32: [2023-04-29 11:26:44,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +50: [2023-04-29 11:26:44,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +50: [2023-04-29 11:26:44,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +46: [2023-04-29 11:26:44,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +46: [2023-04-29 11:26:44,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +46: [2023-04-29 11:26:44,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +46: [2023-04-29 11:26:44,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +46: [2023-04-29 11:26:44,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +46: [2023-04-29 11:26:44,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +55: [2023-04-29 11:26:44,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +55: [2023-04-29 11:26:44,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +34: [2023-04-29 11:26:44,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +55: [2023-04-29 11:26:44,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +55: [2023-04-29 11:26:44,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +32: [2023-04-29 11:26:44,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +40: [2023-04-29 11:26:44,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +11: [2023-04-29 11:26:44,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +40: [2023-04-29 11:26:44,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +40: [2023-04-29 11:26:44,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +40: [2023-04-29 11:26:44,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +57: [2023-04-29 11:26:44,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 11:26:44,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 11:26:44,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 11:26:44,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 11:26:44,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 11:26:44,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 11:26:44,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +10: [2023-04-29 11:26:44,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +57: [2023-04-29 11:26:44,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +40: [2023-04-29 11:26:44,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +46: [2023-04-29 11:26:44,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +50: [2023-04-29 11:26:44,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +46: [2023-04-29 11:26:44,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +46: [2023-04-29 11:26:44,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +46: [2023-04-29 11:26:44,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +46: [2023-04-29 11:26:44,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +46: [2023-04-29 11:26:44,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +40: [2023-04-29 11:26:44,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +46: [2023-04-29 11:26:44,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +46: [2023-04-29 11:26:44,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +34: [2023-04-29 11:26:44,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 11:26:44,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +57: [2023-04-29 11:26:44,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +57: [2023-04-29 11:26:44,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +57: [2023-04-29 11:26:44,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 11:26:44,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +59: [2023-04-29 11:26:44,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +62: [2023-04-29 11:26:44,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +62: [2023-04-29 11:26:44,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +62: [2023-04-29 11:26:44,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +62: [2023-04-29 11:26:44,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +34: [2023-04-29 11:26:44,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +34: [2023-04-29 11:26:44,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +11: [2023-04-29 11:26:44,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +35: [2023-04-29 11:26:44,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 11:26:44,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +57: [2023-04-29 11:26:44,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +10: [2023-04-29 11:26:44,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +58: [2023-04-29 11:26:44,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +58: [2023-04-29 11:26:44,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +58: [2023-04-29 11:26:44,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +58: [2023-04-29 11:26:44,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +59: [2023-04-29 11:26:44,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +59: [2023-04-29 11:26:44,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +59: [2023-04-29 11:26:44,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +59: [2023-04-29 11:26:44,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +59: [2023-04-29 11:26:44,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +59: [2023-04-29 11:26:44,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +39: [2023-04-29 11:26:44,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +34: [2023-04-29 11:26:44,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +11: [2023-04-29 11:26:44,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +42: [2023-04-29 11:26:44,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +11: [2023-04-29 11:26:44,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +10: [2023-04-29 11:26:44,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +39: [2023-04-29 11:26:44,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +39: [2023-04-29 11:26:44,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +39: [2023-04-29 11:26:44,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +56: [2023-04-29 11:26:44,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +56: [2023-04-29 11:26:44,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +56: [2023-04-29 11:26:44,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +36: [2023-04-29 11:26:44,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +59: [2023-04-29 11:26:44,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 11:26:44,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 11:26:44,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +59: [2023-04-29 11:26:44,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +59: [2023-04-29 11:26:44,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +42: [2023-04-29 11:26:44,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +27: [2023-04-29 11:26:44,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +27: [2023-04-29 11:26:44,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +27: [2023-04-29 11:26:44,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +34: [2023-04-29 11:26:44,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +27: [2023-04-29 11:26:44,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +42: [2023-04-29 11:26:44,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +56: [2023-04-29 11:26:44,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +10: [2023-04-29 11:26:44,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +10: [2023-04-29 11:26:44,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +10: [2023-04-29 11:26:44,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +36: [2023-04-29 11:26:44,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +36: [2023-04-29 11:26:44,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +56: [2023-04-29 11:26:44,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 11:26:44,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +10: [2023-04-29 11:26:44,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +10: [2023-04-29 11:26:44,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +35: [2023-04-29 11:26:44,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 11:26:44,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +11: [2023-04-29 11:26:44,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +59: [2023-04-29 11:26:44,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +56: [2023-04-29 11:26:44,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +36: [2023-04-29 11:26:44,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +56: [2023-04-29 11:26:44,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 11:26:44,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +59: [2023-04-29 11:26:44,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +56: [2023-04-29 11:26:44,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +56: [2023-04-29 11:26:44,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +56: [2023-04-29 11:26:44,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +27: [2023-04-29 11:26:44,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +27: [2023-04-29 11:26:44,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +35: [2023-04-29 11:26:44,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +27: [2023-04-29 11:26:44,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +56: [2023-04-29 11:26:44,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +27: [2023-04-29 11:26:44,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +34: [2023-04-29 11:26:44,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +36: [2023-04-29 11:26:44,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +36: [2023-04-29 11:26:44,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +55: [2023-04-29 11:26:44,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +36: [2023-04-29 11:26:44,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +47: [2023-04-29 11:26:44,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +54: [2023-04-29 11:26:44,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +54: [2023-04-29 11:26:44,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +54: [2023-04-29 11:26:44,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +54: [2023-04-29 11:26:44,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +37: [2023-04-29 11:26:44,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +42: [2023-04-29 11:26:44,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +49: [2023-04-29 11:26:44,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +10: [2023-04-29 11:26:44,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +47: [2023-04-29 11:26:44,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +10: [2023-04-29 11:26:44,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +55: [2023-04-29 11:26:44,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +42: [2023-04-29 11:26:44,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +40: [2023-04-29 11:26:44,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +56: [2023-04-29 11:26:44,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +10: [2023-04-29 11:26:44,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +54: [2023-04-29 11:26:44,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +54: [2023-04-29 11:26:44,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +36: [2023-04-29 11:26:44,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +40: [2023-04-29 11:26:44,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 0: [2023-04-29 11:26:44,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +54: [2023-04-29 11:26:44,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +40: [2023-04-29 11:26:44,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +54: [2023-04-29 11:26:44,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +37: [2023-04-29 11:26:44,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +40: [2023-04-29 11:26:44,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 0: [2023-04-29 11:26:44,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 0: [2023-04-29 11:26:44,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 0: [2023-04-29 11:26:44,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 0: [2023-04-29 11:26:44,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 0: [2023-04-29 11:26:44,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 0: [2023-04-29 11:26:44,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 0: [2023-04-29 11:26:44,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +55: [2023-04-29 11:26:44,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +62: [2023-04-29 11:26:44,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +62: [2023-04-29 11:26:44,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +49: [2023-04-29 11:26:44,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +42: [2023-04-29 11:26:44,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +42: [2023-04-29 11:26:44,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +35: [2023-04-29 11:26:44,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 0: [2023-04-29 11:26:44,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +55: [2023-04-29 11:26:44,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 0: [2023-04-29 11:26:44,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +62: [2023-04-29 11:26:44,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +42: [2023-04-29 11:26:44,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 0: [2023-04-29 11:26:44,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +62: [2023-04-29 11:26:44,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +47: [2023-04-29 11:26:44,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +47: [2023-04-29 11:26:44,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +10: [2023-04-29 11:26:44,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +11: [2023-04-29 11:26:44,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 0: [2023-04-29 11:26:44,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 0: [2023-04-29 11:26:44,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 0: [2023-04-29 11:26:44,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 0: [2023-04-29 11:26:44,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 0: [2023-04-29 11:26:44,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +47: [2023-04-29 11:26:44,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +47: [2023-04-29 11:26:44,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +11: [2023-04-29 11:26:44,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +63: [2023-04-29 11:26:44,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +63: [2023-04-29 11:26:44,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +11: [2023-04-29 11:26:44,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +49: [2023-04-29 11:26:44,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +42: [2023-04-29 11:26:44,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +47: [2023-04-29 11:26:44,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +51: [2023-04-29 11:26:44,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +51: [2023-04-29 11:26:44,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +51: [2023-04-29 11:26:44,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +51: [2023-04-29 11:26:44,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +63: [2023-04-29 11:26:44,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +37: [2023-04-29 11:26:44,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +63: [2023-04-29 11:26:44,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +49: [2023-04-29 11:26:44,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +37: [2023-04-29 11:26:44,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +37: [2023-04-29 11:26:44,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +35: [2023-04-29 11:26:44,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +18: [2023-04-29 11:26:44,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +18: [2023-04-29 11:26:44,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +18: [2023-04-29 11:26:44,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +18: [2023-04-29 11:26:44,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +18: [2023-04-29 11:26:44,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +18: [2023-04-29 11:26:44,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +18: [2023-04-29 11:26:44,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +18: [2023-04-29 11:26:44,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +47: [2023-04-29 11:26:44,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +36: [2023-04-29 11:26:44,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +36: [2023-04-29 11:26:44,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +36: [2023-04-29 11:26:44,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +36: [2023-04-29 11:26:44,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +42: [2023-04-29 11:26:44,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +42: [2023-04-29 11:26:44,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +37: [2023-04-29 11:26:44,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +35: [2023-04-29 11:26:44,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +10: [2023-04-29 11:26:44,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +18: [2023-04-29 11:26:44,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +37: [2023-04-29 11:26:44,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +36: [2023-04-29 11:26:44,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +36: [2023-04-29 11:26:44,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +37: [2023-04-29 11:26:44,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +35: [2023-04-29 11:26:44,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +18: [2023-04-29 11:26:44,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +18: [2023-04-29 11:26:44,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +36: [2023-04-29 11:26:44,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +49: [2023-04-29 11:26:44,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +18: [2023-04-29 11:26:44,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +36: [2023-04-29 11:26:44,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +18: [2023-04-29 11:26:44,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +62: [2023-04-29 11:26:44,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +62: [2023-04-29 11:26:44,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +18: [2023-04-29 11:26:44,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +18: [2023-04-29 11:26:44,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +18: [2023-04-29 11:26:44,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +49: [2023-04-29 11:26:44,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +46: [2023-04-29 11:26:44,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +62: [2023-04-29 11:26:44,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +62: [2023-04-29 11:26:44,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +62: [2023-04-29 11:26:44,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +62: [2023-04-29 11:26:44,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +16: [2023-04-29 11:26:44,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +16: [2023-04-29 11:26:44,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +46: [2023-04-29 11:26:44,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +16: [2023-04-29 11:26:44,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +16: [2023-04-29 11:26:44,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +62: [2023-04-29 11:26:44,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +62: [2023-04-29 11:26:44,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +42: [2023-04-29 11:26:44,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +39: [2023-04-29 11:26:44,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +46: [2023-04-29 11:26:44,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +46: [2023-04-29 11:26:44,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 11:26:44,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +63: [2023-04-29 11:26:44,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 11:26:44,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +63: [2023-04-29 11:26:44,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +51: [2023-04-29 11:26:44,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +16: [2023-04-29 11:26:44,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +42: [2023-04-29 11:26:44,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +16: [2023-04-29 11:26:44,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +49: [2023-04-29 11:26:44,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +39: [2023-04-29 11:26:44,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +57: [2023-04-29 11:26:44,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 11:26:44,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +57: [2023-04-29 11:26:44,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +39: [2023-04-29 11:26:44,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +23: [2023-04-29 11:26:44,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +23: [2023-04-29 11:26:44,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +63: [2023-04-29 11:26:44,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +23: [2023-04-29 11:26:44,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +23: [2023-04-29 11:26:44,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +44: [2023-04-29 11:26:44,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +44: [2023-04-29 11:26:44,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +51: [2023-04-29 11:26:44,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +16: [2023-04-29 11:26:44,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +51: [2023-04-29 11:26:44,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +16: [2023-04-29 11:26:44,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +44: [2023-04-29 11:26:44,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +44: [2023-04-29 11:26:44,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +63: [2023-04-29 11:26:44,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +39: [2023-04-29 11:26:44,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +39: [2023-04-29 11:26:44,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +39: [2023-04-29 11:26:44,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +39: [2023-04-29 11:26:44,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 11:26:44,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +27: [2023-04-29 11:26:44,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +49: [2023-04-29 11:26:44,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +39: [2023-04-29 11:26:44,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +27: [2023-04-29 11:26:44,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +39: [2023-04-29 11:26:44,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 7: [2023-04-29 11:26:44,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 7: [2023-04-29 11:26:44,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 7: [2023-04-29 11:26:44,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 7: [2023-04-29 11:26:44,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 7: [2023-04-29 11:26:44,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 7: [2023-04-29 11:26:44,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 7: [2023-04-29 11:26:44,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +15: [2023-04-29 11:26:44,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +15: [2023-04-29 11:26:44,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 7: [2023-04-29 11:26:44,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +51: [2023-04-29 11:26:44,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +51: [2023-04-29 11:26:44,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +51: [2023-04-29 11:26:44,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +12: [2023-04-29 11:26:44,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +12: [2023-04-29 11:26:44,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +39: [2023-04-29 11:26:44,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +15: [2023-04-29 11:26:44,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +51: [2023-04-29 11:26:44,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +39: [2023-04-29 11:26:44,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +12: [2023-04-29 11:26:44,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +15: [2023-04-29 11:26:44,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +15: [2023-04-29 11:26:44,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +15: [2023-04-29 11:26:44,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +15: [2023-04-29 11:26:44,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +12: [2023-04-29 11:26:44,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +12: [2023-04-29 11:26:44,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +12: [2023-04-29 11:26:44,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +12: [2023-04-29 11:26:44,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +15: [2023-04-29 11:26:44,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +12: [2023-04-29 11:26:44,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +46: [2023-04-29 11:26:44,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +42: [2023-04-29 11:26:44,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +59: [2023-04-29 11:26:44,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +39: [2023-04-29 11:26:44,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +17: [2023-04-29 11:26:44,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +17: [2023-04-29 11:26:44,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +17: [2023-04-29 11:26:44,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +17: [2023-04-29 11:26:44,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +39: [2023-04-29 11:26:44,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 7: [2023-04-29 11:26:44,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +56: [2023-04-29 11:26:44,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +56: [2023-04-29 11:26:44,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +56: [2023-04-29 11:26:44,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 7: [2023-04-29 11:26:44,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +45: [2023-04-29 11:26:44,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. + 7: [2023-04-29 11:26:44,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +45: [2023-04-29 11:26:44,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +45: [2023-04-29 11:26:44,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +39: [2023-04-29 11:26:44,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +45: [2023-04-29 11:26:44,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +51: [2023-04-29 11:26:44,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +15: [2023-04-29 11:26:44,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +15: [2023-04-29 11:26:44,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +42: [2023-04-29 11:26:44,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +29: [2023-04-29 11:26:44,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +29: [2023-04-29 11:26:44,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +46: [2023-04-29 11:26:44,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +51: [2023-04-29 11:26:44,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +29: [2023-04-29 11:26:44,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +59: [2023-04-29 11:26:44,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +13: [2023-04-29 11:26:44,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +13: [2023-04-29 11:26:44,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +51: [2023-04-29 11:26:44,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 7: [2023-04-29 11:26:44,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +55: [2023-04-29 11:26:44,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +12: [2023-04-29 11:26:44,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +13: [2023-04-29 11:26:44,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +43: [2023-04-29 11:26:44,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +43: [2023-04-29 11:26:44,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +43: [2023-04-29 11:26:44,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +43: [2023-04-29 11:26:44,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +13: [2023-04-29 11:26:44,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +59: [2023-04-29 11:26:44,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +26: [2023-04-29 11:26:44,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +26: [2023-04-29 11:26:44,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +26: [2023-04-29 11:26:44,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +15: [2023-04-29 11:26:44,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +17: [2023-04-29 11:26:44,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +54: [2023-04-29 11:26:44,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +29: [2023-04-29 11:26:44,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +60: [2023-04-29 11:26:44,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +60: [2023-04-29 11:26:44,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +55: [2023-04-29 11:26:44,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +12: [2023-04-29 11:26:44,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +51: [2023-04-29 11:26:44,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +12: [2023-04-29 11:26:44,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +26: [2023-04-29 11:26:44,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +54: [2023-04-29 11:26:44,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +12: [2023-04-29 11:26:44,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 7: [2023-04-29 11:26:44,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +12: [2023-04-29 11:26:44,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +17: [2023-04-29 11:26:44,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 7: [2023-04-29 11:26:44,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +12: [2023-04-29 11:26:44,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 7: [2023-04-29 11:26:44,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +12: [2023-04-29 11:26:44,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +12: [2023-04-29 11:26:44,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 1: [2023-04-29 11:26:44,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +39: [2023-04-29 11:26:44,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +17: [2023-04-29 11:26:44,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +59: [2023-04-29 11:26:44,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +29: [2023-04-29 11:26:44,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +60: [2023-04-29 11:26:44,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +54: [2023-04-29 11:26:44,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +54: [2023-04-29 11:26:44,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +15: [2023-04-29 11:26:44,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +56: [2023-04-29 11:26:44,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +60: [2023-04-29 11:26:44,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +56: [2023-04-29 11:26:44,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +15: [2023-04-29 11:26:44,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +55: [2023-04-29 11:26:44,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +15: [2023-04-29 11:26:44,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +15: [2023-04-29 11:26:44,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +15: [2023-04-29 11:26:44,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +17: [2023-04-29 11:26:44,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +29: [2023-04-29 11:26:44,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +29: [2023-04-29 11:26:44,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 7: [2023-04-29 11:26:44,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +43: [2023-04-29 11:26:44,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +43: [2023-04-29 11:26:44,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +43: [2023-04-29 11:26:44,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +43: [2023-04-29 11:26:44,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +29: [2023-04-29 11:26:44,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +55: [2023-04-29 11:26:44,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +40: [2023-04-29 11:26:44,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +46: [2023-04-29 11:26:44,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +46: [2023-04-29 11:26:44,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +27: [2023-04-29 11:26:44,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +27: [2023-04-29 11:26:44,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +56: [2023-04-29 11:26:44,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +56: [2023-04-29 11:26:44,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +62: [2023-04-29 11:26:44,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +13: [2023-04-29 11:26:44,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 0: [2023-04-29 11:26:44,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +40: [2023-04-29 11:26:44,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +40: [2023-04-29 11:26:44,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +40: [2023-04-29 11:26:44,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +39: [2023-04-29 11:26:44,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +13: [2023-04-29 11:26:44,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +57: [2023-04-29 11:26:44,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +13: [2023-04-29 11:26:44,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +57: [2023-04-29 11:26:44,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +24: [2023-04-29 11:26:44,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +24: [2023-04-29 11:26:44,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +24: [2023-04-29 11:26:44,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 1: [2023-04-29 11:26:44,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +13: [2023-04-29 11:26:44,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +24: [2023-04-29 11:26:44,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +56: [2023-04-29 11:26:44,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +56: [2023-04-29 11:26:44,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +40: [2023-04-29 11:26:44,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +57: [2023-04-29 11:26:44,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +44: [2023-04-29 11:26:44,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +44: [2023-04-29 11:26:44,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +44: [2023-04-29 11:26:44,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +62: [2023-04-29 11:26:44,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +44: [2023-04-29 11:26:44,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 0: [2023-04-29 11:26:44,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +23: [2023-04-29 11:26:44,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +23: [2023-04-29 11:26:44,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +23: [2023-04-29 11:26:44,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +23: [2023-04-29 11:26:44,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +56: [2023-04-29 11:26:44,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +40: [2023-04-29 11:26:44,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +40: [2023-04-29 11:26:44,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +40: [2023-04-29 11:26:44,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +56: [2023-04-29 11:26:44,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +62: [2023-04-29 11:26:44,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +62: [2023-04-29 11:26:44,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +27: [2023-04-29 11:26:44,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +57: [2023-04-29 11:26:44,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +56: [2023-04-29 11:26:44,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +63: [2023-04-29 11:26:44,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +63: [2023-04-29 11:26:44,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +63: [2023-04-29 11:26:44,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +55: [2023-04-29 11:26:44,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +63: [2023-04-29 11:26:44,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +49: [2023-04-29 11:26:44,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +49: [2023-04-29 11:26:44,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +27: [2023-04-29 11:26:44,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +55: [2023-04-29 11:26:44,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +62: [2023-04-29 11:26:44,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 0: [2023-04-29 11:26:44,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 0: [2023-04-29 11:26:44,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +49: [2023-04-29 11:26:44,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. +63: [2023-04-29 11:26:44,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +49: [2023-04-29 11:26:44,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_30-model_01-model_states.pt. + 8: [2023-04-29 11:26:44,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +62: [2023-04-29 11:26:44,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... + 8: [2023-04-29 11:26:44,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +62: [2023-04-29 11:26:44,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +55: [2023-04-29 11:26:44,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +63: [2023-04-29 11:26:44,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +63: [2023-04-29 11:26:44,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +63: [2023-04-29 11:26:44,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +36: [2023-04-29 11:26:44,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +62: [2023-04-29 11:26:44,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +26: [2023-04-29 11:26:44,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +55: [2023-04-29 11:26:44,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +45: [2023-04-29 11:26:44,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +56: [2023-04-29 11:26:44,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +56: [2023-04-29 11:26:44,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +18: [2023-04-29 11:26:44,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 8: [2023-04-29 11:26:44,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +36: [2023-04-29 11:26:44,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +60: [2023-04-29 11:26:44,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +60: [2023-04-29 11:26:44,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +60: [2023-04-29 11:26:44,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +54: [2023-04-29 11:26:44,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +54: [2023-04-29 11:26:44,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +59: [2023-04-29 11:26:44,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +59: [2023-04-29 11:26:44,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 1: [2023-04-29 11:26:44,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 1: [2023-04-29 11:26:44,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 8: [2023-04-29 11:26:44,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +45: [2023-04-29 11:26:44,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +60: [2023-04-29 11:26:44,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 8: [2023-04-29 11:26:44,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 8: [2023-04-29 11:26:44,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +45: [2023-04-29 11:26:44,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 8: [2023-04-29 11:26:44,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +60: [2023-04-29 11:26:44,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +60: [2023-04-29 11:26:44,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +54: [2023-04-29 11:26:44,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 8: [2023-04-29 11:26:44,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 8: [2023-04-29 11:26:44,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +60: [2023-04-29 11:26:44,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +60: [2023-04-29 11:26:44,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +18: [2023-04-29 11:26:44,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 11:26:44,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +26: [2023-04-29 11:26:44,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +45: [2023-04-29 11:26:44,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +24: [2023-04-29 11:26:44,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 0: [2023-04-29 11:26:44,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +54: [2023-04-29 11:26:44,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +27: [2023-04-29 11:26:44,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +24: [2023-04-29 11:26:44,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +24: [2023-04-29 11:26:44,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +18: [2023-04-29 11:26:44,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +18: [2023-04-29 11:26:44,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +59: [2023-04-29 11:26:44,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +59: [2023-04-29 11:26:44,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +26: [2023-04-29 11:26:44,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +60: [2023-04-29 11:26:44,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +27: [2023-04-29 11:26:44,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +60: [2023-04-29 11:26:44,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +62: [2023-04-29 11:26:44,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +60: [2023-04-29 11:26:44,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +24: [2023-04-29 11:26:44,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +24: [2023-04-29 11:26:44,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 0: [2023-04-29 11:26:44,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +60: [2023-04-29 11:26:44,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +62: [2023-04-29 11:26:44,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +49: [2023-04-29 11:26:44,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +24: [2023-04-29 11:26:44,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +36: [2023-04-29 11:26:44,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 11:26:44,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +62: [2023-04-29 11:26:44,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +62: [2023-04-29 11:26:44,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +16: [2023-04-29 11:26:44,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +49: [2023-04-29 11:26:44,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +24: [2023-04-29 11:26:44,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +24: [2023-04-29 11:26:44,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +52: [2023-04-29 11:26:44,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +52: [2023-04-29 11:26:44,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +52: [2023-04-29 11:26:44,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +33: [2023-04-29 11:26:44,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +33: [2023-04-29 11:26:44,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +33: [2023-04-29 11:26:44,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +33: [2023-04-29 11:26:44,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +52: [2023-04-29 11:26:44,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +24: [2023-04-29 11:26:44,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +24: [2023-04-29 11:26:44,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +49: [2023-04-29 11:26:44,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... + 2: [2023-04-29 11:26:44,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 2: [2023-04-29 11:26:44,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 2: [2023-04-29 11:26:44,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 0: [2023-04-29 11:26:44,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +36: [2023-04-29 11:26:44,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 0: [2023-04-29 11:26:44,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +18: [2023-04-29 11:26:44,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +16: [2023-04-29 11:26:44,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +51: [2023-04-29 11:26:44,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +51: [2023-04-29 11:26:44,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +63: [2023-04-29 11:26:44,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +63: [2023-04-29 11:26:44,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +51: [2023-04-29 11:26:44,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +51: [2023-04-29 11:26:44,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +16: [2023-04-29 11:26:44,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +54: [2023-04-29 11:26:44,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +54: [2023-04-29 11:26:44,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +24: [2023-04-29 11:26:44,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +24: [2023-04-29 11:26:44,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +16: [2023-04-29 11:26:44,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +51: [2023-04-29 11:26:44,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +51: [2023-04-29 11:26:44,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +49: [2023-04-29 11:26:44,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt... +36: [2023-04-29 11:26:44,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +39: [2023-04-29 11:26:44,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +41: [2023-04-29 11:26:44,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +41: [2023-04-29 11:26:44,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +41: [2023-04-29 11:26:44,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +41: [2023-04-29 11:26:44,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +36: [2023-04-29 11:26:44,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +54: [2023-04-29 11:26:44,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +54: [2023-04-29 11:26:44,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +23: [2023-04-29 11:26:44,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +23: [2023-04-29 11:26:44,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +19: [2023-04-29 11:26:44,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +19: [2023-04-29 11:26:44,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +29: [2023-04-29 11:26:44,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +63: [2023-04-29 11:26:44,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +63: [2023-04-29 11:26:44,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +23: [2023-04-29 11:26:44,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 7: [2023-04-29 11:26:44,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +23: [2023-04-29 11:26:44,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +51: [2023-04-29 11:26:44,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +51: [2023-04-29 11:26:44,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +51: [2023-04-29 11:26:44,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +31: [2023-04-29 11:26:44,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +31: [2023-04-29 11:26:44,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +31: [2023-04-29 11:26:44,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +31: [2023-04-29 11:26:44,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +63: [2023-04-29 11:26:44,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +18: [2023-04-29 11:26:44,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +19: [2023-04-29 11:26:44,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +18: [2023-04-29 11:26:44,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +18: [2023-04-29 11:26:44,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +19: [2023-04-29 11:26:44,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +15: [2023-04-29 11:26:44,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +15: [2023-04-29 11:26:44,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +39: [2023-04-29 11:26:44,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +22: [2023-04-29 11:26:44,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +22: [2023-04-29 11:26:44,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +63: [2023-04-29 11:26:44,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +39: [2023-04-29 11:26:44,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +23: [2023-04-29 11:26:44,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +23: [2023-04-29 11:26:44,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +22: [2023-04-29 11:26:44,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +53: [2023-04-29 11:26:44,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +53: [2023-04-29 11:26:44,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +53: [2023-04-29 11:26:44,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +62: [2023-04-29 11:26:44,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +22: [2023-04-29 11:26:44,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +19: [2023-04-29 11:26:44,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +53: [2023-04-29 11:26:44,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +19: [2023-04-29 11:26:44,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +23: [2023-04-29 11:26:44,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +19: [2023-04-29 11:26:44,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +17: [2023-04-29 11:26:44,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +19: [2023-04-29 11:26:44,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +63: [2023-04-29 11:26:44,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +12: [2023-04-29 11:26:44,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +62: [2023-04-29 11:26:44,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +23: [2023-04-29 11:26:44,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +12: [2023-04-29 11:26:44,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +12: [2023-04-29 11:26:44,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +22: [2023-04-29 11:26:44,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +22: [2023-04-29 11:26:44,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +12: [2023-04-29 11:26:44,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +43: [2023-04-29 11:26:44,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +43: [2023-04-29 11:26:44,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +43: [2023-04-29 11:26:44,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +62: [2023-04-29 11:26:44,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +62: [2023-04-29 11:26:44,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +15: [2023-04-29 11:26:44,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +43: [2023-04-29 11:26:44,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +63: [2023-04-29 11:26:44,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +39: [2023-04-29 11:26:44,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +36: [2023-04-29 11:26:44,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 11:26:44,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +17: [2023-04-29 11:26:44,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +44: [2023-04-29 11:26:44,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +29: [2023-04-29 11:26:44,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +29: [2023-04-29 11:26:44,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +22: [2023-04-29 11:26:44,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +52: [2023-04-29 11:26:44,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 7: [2023-04-29 11:26:44,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 7: [2023-04-29 11:26:44,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +33: [2023-04-29 11:26:44,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +43: [2023-04-29 11:26:44,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +17: [2023-04-29 11:26:44,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +51: [2023-04-29 11:26:44,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +52: [2023-04-29 11:26:44,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +17: [2023-04-29 11:26:44,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +51: [2023-04-29 11:26:44,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +16: [2023-04-29 11:26:44,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +15: [2023-04-29 11:26:44,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +33: [2023-04-29 11:26:44,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +33: [2023-04-29 11:26:44,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +22: [2023-04-29 11:26:44,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +52: [2023-04-29 11:26:44,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +52: [2023-04-29 11:26:44,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +44: [2023-04-29 11:26:44,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +21: [2023-04-29 11:26:44,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +21: [2023-04-29 11:26:44,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +21: [2023-04-29 11:26:44,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +44: [2023-04-29 11:26:44,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +16: [2023-04-29 11:26:44,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +36: [2023-04-29 11:26:44,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 7: [2023-04-29 11:26:44,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +21: [2023-04-29 11:26:44,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +43: [2023-04-29 11:26:44,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +39: [2023-04-29 11:26:44,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 2: [2023-04-29 11:26:44,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +51: [2023-04-29 11:26:44,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 11:26:44,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +44: [2023-04-29 11:26:44,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +13: [2023-04-29 11:26:44,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +13: [2023-04-29 11:26:44,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +13: [2023-04-29 11:26:44,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +43: [2023-04-29 11:26:44,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +21: [2023-04-29 11:26:44,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +21: [2023-04-29 11:26:44,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 11:26:44,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +21: [2023-04-29 11:26:44,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +21: [2023-04-29 11:26:44,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +41: [2023-04-29 11:26:44,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +41: [2023-04-29 11:26:44,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 2: [2023-04-29 11:26:44,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +44: [2023-04-29 11:26:44,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +44: [2023-04-29 11:26:44,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +29: [2023-04-29 11:26:44,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +54: [2023-04-29 11:26:44,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +54: [2023-04-29 11:26:44,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +41: [2023-04-29 11:26:44,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +41: [2023-04-29 11:26:44,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +54: [2023-04-29 11:26:44,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 7: [2023-04-29 11:26:44,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +23: [2023-04-29 11:26:44,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +23: [2023-04-29 11:26:44,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +23: [2023-04-29 11:26:44,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +51: [2023-04-29 11:26:44,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +13: [2023-04-29 11:26:44,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +54: [2023-04-29 11:26:44,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +63: [2023-04-29 11:26:44,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +44: [2023-04-29 11:26:44,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +31: [2023-04-29 11:26:44,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +31: [2023-04-29 11:26:44,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +44: [2023-04-29 11:26:44,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +16: [2023-04-29 11:26:44,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +16: [2023-04-29 11:26:44,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +23: [2023-04-29 11:26:44,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +39: [2023-04-29 11:26:44,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +15: [2023-04-29 11:26:44,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +31: [2023-04-29 11:26:44,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +15: [2023-04-29 11:26:44,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +23: [2023-04-29 11:26:44,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +23: [2023-04-29 11:26:44,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +23: [2023-04-29 11:26:44,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +31: [2023-04-29 11:26:44,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +16: [2023-04-29 11:26:44,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 1: [2023-04-29 11:26:44,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +16: [2023-04-29 11:26:44,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +16: [2023-04-29 11:26:44,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +55: [2023-04-29 11:26:44,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +55: [2023-04-29 11:26:44,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +55: [2023-04-29 11:26:44,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +55: [2023-04-29 11:26:44,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +16: [2023-04-29 11:26:44,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +53: [2023-04-29 11:26:44,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +17: [2023-04-29 11:26:44,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +39: [2023-04-29 11:26:44,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +45: [2023-04-29 11:26:44,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +53: [2023-04-29 11:26:44,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +53: [2023-04-29 11:26:44,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +53: [2023-04-29 11:26:44,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +60: [2023-04-29 11:26:44,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +60: [2023-04-29 11:26:44,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +25: [2023-04-29 11:26:44,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +25: [2023-04-29 11:26:44,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +12: [2023-04-29 11:26:44,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +23: [2023-04-29 11:26:44,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +60: [2023-04-29 11:26:44,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +12: [2023-04-29 11:26:44,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +12: [2023-04-29 11:26:44,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +39: [2023-04-29 11:26:44,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +17: [2023-04-29 11:26:44,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +63: [2023-04-29 11:26:44,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +63: [2023-04-29 11:26:44,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +15: [2023-04-29 11:26:44,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +12: [2023-04-29 11:26:44,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +49: [2023-04-29 11:26:44,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +45: [2023-04-29 11:26:44,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +55: [2023-04-29 11:26:44,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +25: [2023-04-29 11:26:44,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +55: [2023-04-29 11:26:44,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +25: [2023-04-29 11:26:44,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +55: [2023-04-29 11:26:44,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +24: [2023-04-29 11:26:44,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +55: [2023-04-29 11:26:44,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +45: [2023-04-29 11:26:44,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +63: [2023-04-29 11:26:44,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +60: [2023-04-29 11:26:44,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +43: [2023-04-29 11:26:44,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +15: [2023-04-29 11:26:44,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +60: [2023-04-29 11:26:44,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +60: [2023-04-29 11:26:44,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +25: [2023-04-29 11:26:44,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +45: [2023-04-29 11:26:44,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +25: [2023-04-29 11:26:44,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +29: [2023-04-29 11:26:44,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +45: [2023-04-29 11:26:44,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +29: [2023-04-29 11:26:44,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 8: [2023-04-29 11:26:44,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +60: [2023-04-29 11:26:44,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +17: [2023-04-29 11:26:44,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +25: [2023-04-29 11:26:44,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +24: [2023-04-29 11:26:44,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +49: [2023-04-29 11:26:44,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +25: [2023-04-29 11:26:44,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +45: [2023-04-29 11:26:44,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +24: [2023-04-29 11:26:44,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +24: [2023-04-29 11:26:44,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +51: [2023-04-29 11:26:44,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 11:26:44,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 11:26:44,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +51: [2023-04-29 11:26:44,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 11:26:44,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +43: [2023-04-29 11:26:44,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +17: [2023-04-29 11:26:44,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +60: [2023-04-29 11:26:44,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +21: [2023-04-29 11:26:44,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +21: [2023-04-29 11:26:44,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 7: [2023-04-29 11:26:44,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 7: [2023-04-29 11:26:44,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +43: [2023-04-29 11:26:44,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 11:26:44,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +45: [2023-04-29 11:26:44,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +49: [2023-04-29 11:26:44,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +29: [2023-04-29 11:26:44,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +32: [2023-04-29 11:26:44,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +32: [2023-04-29 11:26:44,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +51: [2023-04-29 11:26:44,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +32: [2023-04-29 11:26:44,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +32: [2023-04-29 11:26:44,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +32: [2023-04-29 11:26:44,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +32: [2023-04-29 11:26:44,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +32: [2023-04-29 11:26:44,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +32: [2023-04-29 11:26:44,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +21: [2023-04-29 11:26:44,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +60: [2023-04-29 11:26:44,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +21: [2023-04-29 11:26:44,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 1: [2023-04-29 11:26:44,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +45: [2023-04-29 11:26:44,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +43: [2023-04-29 11:26:44,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +49: [2023-04-29 11:26:44,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +63: [2023-04-29 11:26:44,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 7: [2023-04-29 11:26:44,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +32: [2023-04-29 11:26:44,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +13: [2023-04-29 11:26:44,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +49: [2023-04-29 11:26:44,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +13: [2023-04-29 11:26:44,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +49: [2023-04-29 11:26:44,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +26: [2023-04-29 11:26:44,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 11:26:44,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 11:26:44,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 11:26:44,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 11:26:44,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 11:26:44,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 11:26:44,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 11:26:44,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +13: [2023-04-29 11:26:44,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +60: [2023-04-29 11:26:44,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +60: [2023-04-29 11:26:44,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 5: [2023-04-29 11:26:44,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 5: [2023-04-29 11:26:44,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 1: [2023-04-29 11:26:44,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 5: [2023-04-29 11:26:44,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +32: [2023-04-29 11:26:44,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +32: [2023-04-29 11:26:44,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +32: [2023-04-29 11:26:44,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +26: [2023-04-29 11:26:44,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +26: [2023-04-29 11:26:44,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +16: [2023-04-29 11:26:44,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +13: [2023-04-29 11:26:44,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +32: [2023-04-29 11:26:44,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +26: [2023-04-29 11:26:44,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +26: [2023-04-29 11:26:44,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +32: [2023-04-29 11:26:44,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +32: [2023-04-29 11:26:44,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +49: [2023-04-29 11:26:44,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_00-model_states.pt. +32: [2023-04-29 11:26:44,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... + 1: [2023-04-29 11:26:44,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 11:26:44,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +29: [2023-04-29 11:26:44,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +26: [2023-04-29 11:26:44,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +29: [2023-04-29 11:26:44,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +29: [2023-04-29 11:26:44,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +26: [2023-04-29 11:26:44,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +26: [2023-04-29 11:26:44,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +26: [2023-04-29 11:26:44,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +16: [2023-04-29 11:26:44,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +60: [2023-04-29 11:26:44,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +60: [2023-04-29 11:26:44,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +24: [2023-04-29 11:26:44,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +63: [2023-04-29 11:26:44,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +63: [2023-04-29 11:26:44,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +24: [2023-04-29 11:26:44,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +24: [2023-04-29 11:26:44,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +24: [2023-04-29 11:26:44,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +16: [2023-04-29 11:26:44,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +16: [2023-04-29 11:26:44,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +60: [2023-04-29 11:26:44,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 5: [2023-04-29 11:26:44,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +49: [2023-04-29 11:26:44,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt... +63: [2023-04-29 11:26:44,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 9: [2023-04-29 11:26:44,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +24: [2023-04-29 11:26:44,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +19: [2023-04-29 11:26:44,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +23: [2023-04-29 11:26:44,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +23: [2023-04-29 11:26:44,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +19: [2023-04-29 11:26:44,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 5: [2023-04-29 11:26:44,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +21: [2023-04-29 11:26:44,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +22: [2023-04-29 11:26:44,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +19: [2023-04-29 11:26:44,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +21: [2023-04-29 11:26:44,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 3: [2023-04-29 11:26:44,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 9: [2023-04-29 11:26:44,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +24: [2023-04-29 11:26:44,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +24: [2023-04-29 11:26:44,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 5: [2023-04-29 11:26:44,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +23: [2023-04-29 11:26:44,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 8: [2023-04-29 11:26:44,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 8: [2023-04-29 11:26:44,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +24: [2023-04-29 11:26:44,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 5: [2023-04-29 11:26:44,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +21: [2023-04-29 11:26:44,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +19: [2023-04-29 11:26:44,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 8: [2023-04-29 11:26:44,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +24: [2023-04-29 11:26:44,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +24: [2023-04-29 11:26:44,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 5: [2023-04-29 11:26:44,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +23: [2023-04-29 11:26:44,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +22: [2023-04-29 11:26:44,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +22: [2023-04-29 11:26:44,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +21: [2023-04-29 11:26:44,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 1: [2023-04-29 11:26:44,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 3: [2023-04-29 11:26:44,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +22: [2023-04-29 11:26:44,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 3: [2023-04-29 11:26:44,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 11:26:44,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +30: [2023-04-29 11:26:44,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +30: [2023-04-29 11:26:44,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 11:26:44,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +61: [2023-04-29 11:26:44,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 1: [2023-04-29 11:26:44,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +61: [2023-04-29 11:26:44,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +61: [2023-04-29 11:26:44,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +61: [2023-04-29 11:26:44,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +61: [2023-04-29 11:26:44,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +61: [2023-04-29 11:26:44,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +61: [2023-04-29 11:26:44,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +61: [2023-04-29 11:26:44,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +60: [2023-04-29 11:26:44,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +54: [2023-04-29 11:26:44,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +54: [2023-04-29 11:26:44,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +54: [2023-04-29 11:26:44,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 11:26:44,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +48: [2023-04-29 11:26:44,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +48: [2023-04-29 11:26:44,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +48: [2023-04-29 11:26:44,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. + 1: [2023-04-29 11:26:44,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +30: [2023-04-29 11:26:44,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 11:26:44,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 11:26:44,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 11:26:44,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +61: [2023-04-29 11:26:44,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +61: [2023-04-29 11:26:44,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +61: [2023-04-29 11:26:44,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +61: [2023-04-29 11:26:44,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +54: [2023-04-29 11:26:44,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +61: [2023-04-29 11:26:44,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... + 5: [2023-04-29 11:26:44,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +61: [2023-04-29 11:26:44,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +54: [2023-04-29 11:26:44,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +54: [2023-04-29 11:26:44,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... + 5: [2023-04-29 11:26:44,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +61: [2023-04-29 11:26:44,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +54: [2023-04-29 11:26:44,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +61: [2023-04-29 11:26:44,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +21: [2023-04-29 11:26:44,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +29: [2023-04-29 11:26:44,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +29: [2023-04-29 11:26:44,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +60: [2023-04-29 11:26:44,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +21: [2023-04-29 11:26:44,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +21: [2023-04-29 11:26:44,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +21: [2023-04-29 11:26:44,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 5: [2023-04-29 11:26:44,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +55: [2023-04-29 11:26:44,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +29: [2023-04-29 11:26:44,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +54: [2023-04-29 11:26:44,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +19: [2023-04-29 11:26:44,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +22: [2023-04-29 11:26:44,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 2: [2023-04-29 11:26:44,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +23: [2023-04-29 11:26:44,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +23: [2023-04-29 11:26:44,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 11:26:44,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 3: [2023-04-29 11:26:44,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 3: [2023-04-29 11:26:44,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 3: [2023-04-29 11:26:44,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 3: [2023-04-29 11:26:44,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +19: [2023-04-29 11:26:44,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 11:26:44,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +17: [2023-04-29 11:26:44,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +17: [2023-04-29 11:26:44,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +19: [2023-04-29 11:26:44,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 11:26:44,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 9: [2023-04-29 11:26:44,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +55: [2023-04-29 11:26:44,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +24: [2023-04-29 11:26:44,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +24: [2023-04-29 11:26:44,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 11:26:44,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +30: [2023-04-29 11:26:44,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +19: [2023-04-29 11:26:44,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +25: [2023-04-29 11:26:44,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +25: [2023-04-29 11:26:44,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +27: [2023-04-29 11:26:44,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +27: [2023-04-29 11:26:44,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +27: [2023-04-29 11:26:44,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +23: [2023-04-29 11:26:44,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +27: [2023-04-29 11:26:44,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 6: [2023-04-29 11:26:44,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 6: [2023-04-29 11:26:44,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 6: [2023-04-29 11:26:44,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 6: [2023-04-29 11:26:44,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +43: [2023-04-29 11:26:44,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +25: [2023-04-29 11:26:44,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +22: [2023-04-29 11:26:44,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 2: [2023-04-29 11:26:44,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 2: [2023-04-29 11:26:44,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 2: [2023-04-29 11:26:44,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 2: [2023-04-29 11:26:44,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +55: [2023-04-29 11:26:44,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +43: [2023-04-29 11:26:44,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +25: [2023-04-29 11:26:44,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +25: [2023-04-29 11:26:44,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +22: [2023-04-29 11:26:44,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 11:26:44,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +30: [2023-04-29 11:26:44,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +11: [2023-04-29 11:26:44,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +11: [2023-04-29 11:26:44,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +23: [2023-04-29 11:26:44,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 4: [2023-04-29 11:26:44,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +55: [2023-04-29 11:26:44,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +25: [2023-04-29 11:26:44,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +48: [2023-04-29 11:26:44,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +43: [2023-04-29 11:26:44,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +43: [2023-04-29 11:26:44,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +43: [2023-04-29 11:26:44,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +25: [2023-04-29 11:26:44,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +11: [2023-04-29 11:26:44,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 4: [2023-04-29 11:26:44,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +11: [2023-04-29 11:26:44,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +48: [2023-04-29 11:26:44,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +25: [2023-04-29 11:26:44,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +43: [2023-04-29 11:26:44,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 11:26:44,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 4: [2023-04-29 11:26:44,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 11:26:44,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 11:26:44,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 11:26:44,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +48: [2023-04-29 11:26:44,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +22: [2023-04-29 11:26:44,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 11:26:44,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +43: [2023-04-29 11:26:44,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +22: [2023-04-29 11:26:44,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +22: [2023-04-29 11:26:44,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +55: [2023-04-29 11:26:44,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 11:26:44,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +14: [2023-04-29 11:26:44,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +14: [2023-04-29 11:26:44,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 11:26:44,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +21: [2023-04-29 11:26:44,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +28: [2023-04-29 11:26:44,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +21: [2023-04-29 11:26:44,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +28: [2023-04-29 11:26:44,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +28: [2023-04-29 11:26:44,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +20: [2023-04-29 11:26:44,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +20: [2023-04-29 11:26:44,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +20: [2023-04-29 11:26:44,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +20: [2023-04-29 11:26:44,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +28: [2023-04-29 11:26:44,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +22: [2023-04-29 11:26:44,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 2: [2023-04-29 11:26:44,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +22: [2023-04-29 11:26:44,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +14: [2023-04-29 11:26:44,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +14: [2023-04-29 11:26:44,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 11:26:44,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +21: [2023-04-29 11:26:44,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +21: [2023-04-29 11:26:44,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +16: [2023-04-29 11:26:44,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 11:26:44,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 11:26:44,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 11:26:44,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +14: [2023-04-29 11:26:44,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +14: [2023-04-29 11:26:44,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +14: [2023-04-29 11:26:44,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +28: [2023-04-29 11:26:44,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +28: [2023-04-29 11:26:44,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +55: [2023-04-29 11:26:44,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 2: [2023-04-29 11:26:44,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +14: [2023-04-29 11:26:44,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 2: [2023-04-29 11:26:44,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 2: [2023-04-29 11:26:44,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +17: [2023-04-29 11:26:44,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +17: [2023-04-29 11:26:44,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +30: [2023-04-29 11:26:44,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +30: [2023-04-29 11:26:44,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +17: [2023-04-29 11:26:44,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +26: [2023-04-29 11:26:44,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +17: [2023-04-29 11:26:44,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 2: [2023-04-29 11:26:44,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +14: [2023-04-29 11:26:44,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 3: [2023-04-29 11:26:44,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +27: [2023-04-29 11:26:44,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 4: [2023-04-29 11:26:44,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 4: [2023-04-29 11:26:44,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 4: [2023-04-29 11:26:44,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 4: [2023-04-29 11:26:44,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +14: [2023-04-29 11:26:44,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +27: [2023-04-29 11:26:44,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +14: [2023-04-29 11:26:44,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +27: [2023-04-29 11:26:44,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +27: [2023-04-29 11:26:44,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +14: [2023-04-29 11:26:44,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +55: [2023-04-29 11:26:44,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +32: [2023-04-29 11:26:44,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +32: [2023-04-29 11:26:44,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +32: [2023-04-29 11:26:44,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +32: [2023-04-29 11:26:44,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +31: [2023-04-29 11:26:44,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +31: [2023-04-29 11:26:44,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +31: [2023-04-29 11:26:44,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +31: [2023-04-29 11:26:44,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +31: [2023-04-29 11:26:44,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +31: [2023-04-29 11:26:44,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +31: [2023-04-29 11:26:44,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +31: [2023-04-29 11:26:44,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +16: [2023-04-29 11:26:44,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 3: [2023-04-29 11:26:44,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 3: [2023-04-29 11:26:44,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +25: [2023-04-29 11:26:44,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +25: [2023-04-29 11:26:44,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 11:26:44,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +25: [2023-04-29 11:26:44,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +55: [2023-04-29 11:26:44,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +16: [2023-04-29 11:26:44,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +16: [2023-04-29 11:26:44,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +16: [2023-04-29 11:26:44,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +11: [2023-04-29 11:26:44,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +25: [2023-04-29 11:26:44,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +11: [2023-04-29 11:26:44,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +25: [2023-04-29 11:26:44,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +31: [2023-04-29 11:26:44,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +31: [2023-04-29 11:26:44,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +31: [2023-04-29 11:26:44,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 3: [2023-04-29 11:26:44,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +31: [2023-04-29 11:26:44,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +31: [2023-04-29 11:26:44,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +31: [2023-04-29 11:26:44,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +31: [2023-04-29 11:26:44,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +31: [2023-04-29 11:26:44,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +25: [2023-04-29 11:26:44,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +25: [2023-04-29 11:26:44,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +30: [2023-04-29 11:26:44,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +61: [2023-04-29 11:26:44,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +21: [2023-04-29 11:26:44,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +11: [2023-04-29 11:26:44,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +25: [2023-04-29 11:26:44,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +21: [2023-04-29 11:26:44,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 5: [2023-04-29 11:26:44,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +22: [2023-04-29 11:26:44,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +22: [2023-04-29 11:26:44,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +16: [2023-04-29 11:26:44,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +16: [2023-04-29 11:26:44,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +11: [2023-04-29 11:26:44,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +11: [2023-04-29 11:26:44,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +11: [2023-04-29 11:26:44,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +11: [2023-04-29 11:26:44,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +11: [2023-04-29 11:26:44,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +16: [2023-04-29 11:26:44,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 3: [2023-04-29 11:26:44,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +21: [2023-04-29 11:26:44,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +21: [2023-04-29 11:26:44,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +11: [2023-04-29 11:26:44,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +21: [2023-04-29 11:26:44,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +20: [2023-04-29 11:26:44,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +13: [2023-04-29 11:26:44,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 5: [2023-04-29 11:26:44,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +13: [2023-04-29 11:26:44,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +13: [2023-04-29 11:26:44,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. +21: [2023-04-29 11:26:44,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +13: [2023-04-29 11:26:44,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_08-model_01-model_states.pt. + 5: [2023-04-29 11:26:44,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 11:26:44,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +28: [2023-04-29 11:26:44,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +20: [2023-04-29 11:26:44,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +14: [2023-04-29 11:26:44,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +14: [2023-04-29 11:26:44,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +26: [2023-04-29 11:26:44,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +61: [2023-04-29 11:26:44,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +61: [2023-04-29 11:26:44,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +26: [2023-04-29 11:26:44,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +22: [2023-04-29 11:26:44,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +21: [2023-04-29 11:26:44,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +28: [2023-04-29 11:26:44,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +11: [2023-04-29 11:26:44,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +11: [2023-04-29 11:26:44,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +11: [2023-04-29 11:26:44,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +21: [2023-04-29 11:26:44,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 4: [2023-04-29 11:26:44,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +28: [2023-04-29 11:26:44,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 3: [2023-04-29 11:26:44,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +26: [2023-04-29 11:26:44,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +26: [2023-04-29 11:26:44,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +22: [2023-04-29 11:26:44,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +20: [2023-04-29 11:26:44,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +20: [2023-04-29 11:26:44,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +14: [2023-04-29 11:26:44,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 4: [2023-04-29 11:26:44,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 4: [2023-04-29 11:26:44,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +29: [2023-04-29 11:26:44,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 11:26:44,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +14: [2023-04-29 11:26:44,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 3: [2023-04-29 11:26:44,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +29: [2023-04-29 11:26:44,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +29: [2023-04-29 11:26:44,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 5: [2023-04-29 11:26:44,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +61: [2023-04-29 11:26:44,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +53: [2023-04-29 11:26:44,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +53: [2023-04-29 11:26:44,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +53: [2023-04-29 11:26:44,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +53: [2023-04-29 11:26:44,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +53: [2023-04-29 11:26:44,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +53: [2023-04-29 11:26:44,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +53: [2023-04-29 11:26:44,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +53: [2023-04-29 11:26:44,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 5: [2023-04-29 11:26:44,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +32: [2023-04-29 11:26:44,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +32: [2023-04-29 11:26:44,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +29: [2023-04-29 11:26:44,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +29: [2023-04-29 11:26:44,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +30: [2023-04-29 11:26:44,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +30: [2023-04-29 11:26:44,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +30: [2023-04-29 11:26:44,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +32: [2023-04-29 11:26:44,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +61: [2023-04-29 11:26:44,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +32: [2023-04-29 11:26:44,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +29: [2023-04-29 11:26:44,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 9: [2023-04-29 11:26:44,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +53: [2023-04-29 11:26:44,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +29: [2023-04-29 11:26:44,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +53: [2023-04-29 11:26:44,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +53: [2023-04-29 11:26:44,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +53: [2023-04-29 11:26:44,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... + 9: [2023-04-29 11:26:44,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +53: [2023-04-29 11:26:44,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +53: [2023-04-29 11:26:44,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +53: [2023-04-29 11:26:44,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 4: [2023-04-29 11:26:44,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +53: [2023-04-29 11:26:44,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 5: [2023-04-29 11:26:44,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 11:26:44,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 3: [2023-04-29 11:26:44,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 3: [2023-04-29 11:26:44,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 5: [2023-04-29 11:26:44,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 9: [2023-04-29 11:26:44,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +38: [2023-04-29 11:26:44,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +38: [2023-04-29 11:26:44,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +38: [2023-04-29 11:26:44,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. + 9: [2023-04-29 11:26:44,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +38: [2023-04-29 11:26:44,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. + 5: [2023-04-29 11:26:44,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +58: [2023-04-29 11:26:44,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +58: [2023-04-29 11:26:44,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +58: [2023-04-29 11:26:44,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +58: [2023-04-29 11:26:44,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +61: [2023-04-29 11:26:44,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +61: [2023-04-29 11:26:44,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +13: [2023-04-29 11:26:44,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +13: [2023-04-29 11:26:44,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 5: [2023-04-29 11:26:44,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 2: [2023-04-29 11:26:44,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +13: [2023-04-29 11:26:44,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +13: [2023-04-29 11:26:44,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +17: [2023-04-29 11:26:44,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 11:26:44,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +30: [2023-04-29 11:26:44,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +10: [2023-04-29 11:26:44,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +10: [2023-04-29 11:26:44,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +10: [2023-04-29 11:26:44,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +28: [2023-04-29 11:26:44,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +10: [2023-04-29 11:26:44,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 6: [2023-04-29 11:26:44,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 2: [2023-04-29 11:26:44,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +27: [2023-04-29 11:26:44,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 6: [2023-04-29 11:26:44,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 6: [2023-04-29 11:26:44,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 9: [2023-04-29 11:26:44,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 11:26:44,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +17: [2023-04-29 11:26:44,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 6: [2023-04-29 11:26:44,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 3: [2023-04-29 11:26:44,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +10: [2023-04-29 11:26:44,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 11:26:44,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +10: [2023-04-29 11:26:44,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 11:26:44,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +61: [2023-04-29 11:26:44,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 9: [2023-04-29 11:26:44,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 9: [2023-04-29 11:26:44,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 4: [2023-04-29 11:26:44,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +30: [2023-04-29 11:26:44,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +30: [2023-04-29 11:26:44,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +17: [2023-04-29 11:26:44,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +17: [2023-04-29 11:26:44,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +10: [2023-04-29 11:26:44,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 3: [2023-04-29 11:26:44,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 11:26:44,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +30: [2023-04-29 11:26:44,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 11:26:44,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +10: [2023-04-29 11:26:44,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +27: [2023-04-29 11:26:44,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +27: [2023-04-29 11:26:44,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +27: [2023-04-29 11:26:44,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +11: [2023-04-29 11:26:44,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +17: [2023-04-29 11:26:44,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +11: [2023-04-29 11:26:44,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 6: [2023-04-29 11:26:44,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 6: [2023-04-29 11:26:44,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +30: [2023-04-29 11:26:44,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 3: [2023-04-29 11:26:44,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +27: [2023-04-29 11:26:44,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +17: [2023-04-29 11:26:44,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +31: [2023-04-29 11:26:44,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +17: [2023-04-29 11:26:44,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +25: [2023-04-29 11:26:44,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +25: [2023-04-29 11:26:44,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 11:26:44,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +31: [2023-04-29 11:26:44,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +14: [2023-04-29 11:26:44,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 11:26:44,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +38: [2023-04-29 11:26:44,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +11: [2023-04-29 11:26:44,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +38: [2023-04-29 11:26:44,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +27: [2023-04-29 11:26:44,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +27: [2023-04-29 11:26:44,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +31: [2023-04-29 11:26:44,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +31: [2023-04-29 11:26:44,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +58: [2023-04-29 11:26:44,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +27: [2023-04-29 11:26:44,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +25: [2023-04-29 11:26:44,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 11:26:44,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +14: [2023-04-29 11:26:44,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +25: [2023-04-29 11:26:44,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +38: [2023-04-29 11:26:44,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +38: [2023-04-29 11:26:44,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +25: [2023-04-29 11:26:44,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +25: [2023-04-29 11:26:44,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 2: [2023-04-29 11:26:44,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +58: [2023-04-29 11:26:44,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +22: [2023-04-29 11:26:44,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +22: [2023-04-29 11:26:44,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +58: [2023-04-29 11:26:44,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +14: [2023-04-29 11:26:44,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +25: [2023-04-29 11:26:44,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +58: [2023-04-29 11:26:44,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 3: [2023-04-29 11:26:44,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +25: [2023-04-29 11:26:44,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +14: [2023-04-29 11:26:44,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 11:26:44,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +14: [2023-04-29 11:26:44,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +37: [2023-04-29 11:26:44,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +37: [2023-04-29 11:26:44,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +45: [2023-04-29 11:26:44,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +45: [2023-04-29 11:26:44,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +45: [2023-04-29 11:26:44,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +45: [2023-04-29 11:26:44,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +37: [2023-04-29 11:26:44,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +37: [2023-04-29 11:26:44,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +22: [2023-04-29 11:26:44,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +22: [2023-04-29 11:26:44,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 3: [2023-04-29 11:26:44,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +20: [2023-04-29 11:26:44,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +20: [2023-04-29 11:26:44,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +20: [2023-04-29 11:26:44,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +20: [2023-04-29 11:26:44,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +20: [2023-04-29 11:26:44,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 3: [2023-04-29 11:26:44,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +20: [2023-04-29 11:26:44,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +47: [2023-04-29 11:26:44,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +47: [2023-04-29 11:26:44,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +47: [2023-04-29 11:26:44,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +14: [2023-04-29 11:26:44,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +47: [2023-04-29 11:26:44,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +37: [2023-04-29 11:26:44,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +45: [2023-04-29 11:26:44,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +45: [2023-04-29 11:26:44,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +14: [2023-04-29 11:26:44,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +37: [2023-04-29 11:26:44,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +14: [2023-04-29 11:26:44,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 11:26:44,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +20: [2023-04-29 11:26:44,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +22: [2023-04-29 11:26:44,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +20: [2023-04-29 11:26:44,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 4: [2023-04-29 11:26:44,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +20: [2023-04-29 11:26:44,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 3: [2023-04-29 11:26:44,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +37: [2023-04-29 11:26:44,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +20: [2023-04-29 11:26:44,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +11: [2023-04-29 11:26:44,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +45: [2023-04-29 11:26:44,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +37: [2023-04-29 11:26:44,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +45: [2023-04-29 11:26:44,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +20: [2023-04-29 11:26:44,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... + 3: [2023-04-29 11:26:44,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +53: [2023-04-29 11:26:44,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +28: [2023-04-29 11:26:44,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 2: [2023-04-29 11:26:44,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 2: [2023-04-29 11:26:44,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +20: [2023-04-29 11:26:44,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt... +22: [2023-04-29 11:26:44,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. + 2: [2023-04-29 11:26:44,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +20: [2023-04-29 11:26:44,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 11:26:44,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +30: [2023-04-29 11:26:44,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +14: [2023-04-29 11:26:44,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +14: [2023-04-29 11:26:44,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +22: [2023-04-29 11:26:44,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +33: [2023-04-29 11:26:44,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 11:26:44,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 11:26:44,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +33: [2023-04-29 11:26:44,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 11:26:44,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 11:26:44,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 11:26:44,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 11:26:44,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +28: [2023-04-29 11:26:44,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +31: [2023-04-29 11:26:44,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +20: [2023-04-29 11:26:44,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +20: [2023-04-29 11:26:44,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +22: [2023-04-29 11:26:44,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 4: [2023-04-29 11:26:44,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +31: [2023-04-29 11:26:44,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 11:26:44,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +33: [2023-04-29 11:26:44,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +14: [2023-04-29 11:26:44,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +33: [2023-04-29 11:26:44,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 4: [2023-04-29 11:26:44,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +33: [2023-04-29 11:26:44,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +28: [2023-04-29 11:26:44,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 0: [2023-04-29 11:26:44,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 0: [2023-04-29 11:26:44,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 0: [2023-04-29 11:26:44,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 0: [2023-04-29 11:26:44,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +33: [2023-04-29 11:26:44,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 4: [2023-04-29 11:26:44,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +31: [2023-04-29 11:26:44,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +31: [2023-04-29 11:26:44,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +53: [2023-04-29 11:26:44,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +11: [2023-04-29 11:26:44,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 11:26:44,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +33: [2023-04-29 11:26:44,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +33: [2023-04-29 11:26:44,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +33: [2023-04-29 11:26:44,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +33: [2023-04-29 11:26:44,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +28: [2023-04-29 11:26:44,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 11:26:44,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +11: [2023-04-29 11:26:44,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +11: [2023-04-29 11:26:44,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +11: [2023-04-29 11:26:44,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +20: [2023-04-29 11:26:44,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +11: [2023-04-29 11:26:44,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +11: [2023-04-29 11:26:44,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +28: [2023-04-29 11:26:44,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +53: [2023-04-29 11:26:44,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +53: [2023-04-29 11:26:44,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +27: [2023-04-29 11:26:44,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +27: [2023-04-29 11:26:44,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +27: [2023-04-29 11:26:44,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +27: [2023-04-29 11:26:44,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... + 4: [2023-04-29 11:26:44,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +14: [2023-04-29 11:26:44,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +14: [2023-04-29 11:26:44,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 11:26:44,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +44: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +44: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +44: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +44: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +52: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +52: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +47: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +52: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +52: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +52: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +52: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +52: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +34: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +34: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +34: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 11:26:44,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +34: [2023-04-29 11:26:44,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +52: [2023-04-29 11:26:44,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +47: [2023-04-29 11:26:44,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +27: [2023-04-29 11:26:44,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +27: [2023-04-29 11:26:44,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +27: [2023-04-29 11:26:44,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +27: [2023-04-29 11:26:44,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 11:26:44,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +11: [2023-04-29 11:26:44,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +47: [2023-04-29 11:26:44,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +47: [2023-04-29 11:26:44,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +47: [2023-04-29 11:26:44,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +47: [2023-04-29 11:26:44,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +47: [2023-04-29 11:26:44,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +47: [2023-04-29 11:26:44,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 4: [2023-04-29 11:26:44,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +34: [2023-04-29 11:26:44,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 4: [2023-04-29 11:26:44,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +14: [2023-04-29 11:26:44,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +44: [2023-04-29 11:26:44,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +44: [2023-04-29 11:26:44,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +48: [2023-04-29 11:26:44,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +53: [2023-04-29 11:26:44,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +44: [2023-04-29 11:26:44,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +13: [2023-04-29 11:26:44,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +11: [2023-04-29 11:26:44,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +52: [2023-04-29 11:26:44,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +52: [2023-04-29 11:26:44,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +52: [2023-04-29 11:26:44,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +48: [2023-04-29 11:26:44,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +52: [2023-04-29 11:26:44,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +47: [2023-04-29 11:26:44,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +52: [2023-04-29 11:26:44,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +52: [2023-04-29 11:26:44,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +52: [2023-04-29 11:26:44,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +50: [2023-04-29 11:26:44,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +44: [2023-04-29 11:26:44,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +48: [2023-04-29 11:26:44,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +50: [2023-04-29 11:26:44,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +50: [2023-04-29 11:26:44,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +48: [2023-04-29 11:26:44,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +50: [2023-04-29 11:26:44,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +50: [2023-04-29 11:26:44,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +52: [2023-04-29 11:26:44,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +50: [2023-04-29 11:26:44,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +11: [2023-04-29 11:26:44,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +48: [2023-04-29 11:26:44,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +34: [2023-04-29 11:26:44,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +34: [2023-04-29 11:26:44,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +34: [2023-04-29 11:26:44,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +34: [2023-04-29 11:26:44,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +10: [2023-04-29 11:26:44,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +48: [2023-04-29 11:26:44,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +13: [2023-04-29 11:26:44,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +13: [2023-04-29 11:26:44,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +14: [2023-04-29 11:26:44,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +48: [2023-04-29 11:26:44,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +48: [2023-04-29 11:26:44,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +38: [2023-04-29 11:26:44,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +38: [2023-04-29 11:26:44,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +34: [2023-04-29 11:26:44,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 4: [2023-04-29 11:26:44,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +50: [2023-04-29 11:26:44,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +50: [2023-04-29 11:26:44,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +47: [2023-04-29 11:26:44,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +58: [2023-04-29 11:26:44,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +58: [2023-04-29 11:26:44,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +58: [2023-04-29 11:26:44,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +47: [2023-04-29 11:26:44,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +58: [2023-04-29 11:26:44,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 4: [2023-04-29 11:26:44,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +47: [2023-04-29 11:26:44,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +38: [2023-04-29 11:26:44,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +38: [2023-04-29 11:26:44,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +40: [2023-04-29 11:26:44,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +35: [2023-04-29 11:26:44,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +35: [2023-04-29 11:26:44,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +40: [2023-04-29 11:26:44,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +40: [2023-04-29 11:26:44,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +40: [2023-04-29 11:26:44,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +38: [2023-04-29 11:26:44,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +13: [2023-04-29 11:26:44,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +10: [2023-04-29 11:26:44,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +50: [2023-04-29 11:26:44,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +34: [2023-04-29 11:26:44,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +34: [2023-04-29 11:26:44,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +50: [2023-04-29 11:26:44,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +35: [2023-04-29 11:26:44,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +13: [2023-04-29 11:26:44,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +14: [2023-04-29 11:26:44,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +35: [2023-04-29 11:26:44,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 0: [2023-04-29 11:26:44,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +38: [2023-04-29 11:26:44,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +18: [2023-04-29 11:26:44,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +13: [2023-04-29 11:26:44,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +18: [2023-04-29 11:26:44,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +18: [2023-04-29 11:26:44,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +58: [2023-04-29 11:26:44,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +53: [2023-04-29 11:26:44,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +58: [2023-04-29 11:26:44,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +58: [2023-04-29 11:26:44,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +58: [2023-04-29 11:26:44,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +18: [2023-04-29 11:26:44,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 0: [2023-04-29 11:26:44,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +38: [2023-04-29 11:26:44,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +38: [2023-04-29 11:26:44,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +35: [2023-04-29 11:26:44,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +35: [2023-04-29 11:26:44,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +50: [2023-04-29 11:26:44,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +38: [2023-04-29 11:26:44,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +40: [2023-04-29 11:26:44,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +40: [2023-04-29 11:26:44,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +10: [2023-04-29 11:26:44,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +10: [2023-04-29 11:26:44,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +13: [2023-04-29 11:26:44,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +40: [2023-04-29 11:26:44,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +35: [2023-04-29 11:26:44,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +35: [2023-04-29 11:26:44,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +50: [2023-04-29 11:26:44,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 0: [2023-04-29 11:26:44,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +18: [2023-04-29 11:26:44,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +35: [2023-04-29 11:26:44,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +40: [2023-04-29 11:26:44,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +35: [2023-04-29 11:26:44,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +18: [2023-04-29 11:26:44,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +18: [2023-04-29 11:26:44,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +53: [2023-04-29 11:26:44,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +53: [2023-04-29 11:26:44,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +11: [2023-04-29 11:26:44,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +35: [2023-04-29 11:26:44,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 0: [2023-04-29 11:26:44,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +18: [2023-04-29 11:26:44,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +57: [2023-04-29 11:26:44,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +57: [2023-04-29 11:26:44,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +38: [2023-04-29 11:26:44,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +11: [2023-04-29 11:26:44,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +11: [2023-04-29 11:26:44,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +58: [2023-04-29 11:26:44,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +35: [2023-04-29 11:26:44,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +37: [2023-04-29 11:26:44,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +13: [2023-04-29 11:26:44,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt... +38: [2023-04-29 11:26:44,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +58: [2023-04-29 11:26:44,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +38: [2023-04-29 11:26:44,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +57: [2023-04-29 11:26:44,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +57: [2023-04-29 11:26:44,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +10: [2023-04-29 11:26:44,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 6: [2023-04-29 11:26:44,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 6: [2023-04-29 11:26:44,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 6: [2023-04-29 11:26:44,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +50: [2023-04-29 11:26:44,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +56: [2023-04-29 11:26:44,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +56: [2023-04-29 11:26:44,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +56: [2023-04-29 11:26:44,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +56: [2023-04-29 11:26:44,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +38: [2023-04-29 11:26:44,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +45: [2023-04-29 11:26:44,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +58: [2023-04-29 11:26:44,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +58: [2023-04-29 11:26:44,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +34: [2023-04-29 11:26:44,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +34: [2023-04-29 11:26:44,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +20: [2023-04-29 11:26:44,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +38: [2023-04-29 11:26:44,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +62: [2023-04-29 11:26:44,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +62: [2023-04-29 11:26:44,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +50: [2023-04-29 11:26:44,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +62: [2023-04-29 11:26:44,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +59: [2023-04-29 11:26:44,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +59: [2023-04-29 11:26:44,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +59: [2023-04-29 11:26:44,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +59: [2023-04-29 11:26:44,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +50: [2023-04-29 11:26:44,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +50: [2023-04-29 11:26:44,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +62: [2023-04-29 11:26:44,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. + 6: [2023-04-29 11:26:44,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 6: [2023-04-29 11:26:44,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +10: [2023-04-29 11:26:44,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +58: [2023-04-29 11:26:44,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +38: [2023-04-29 11:26:44,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +45: [2023-04-29 11:26:44,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +20: [2023-04-29 11:26:44,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +38: [2023-04-29 11:26:44,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +58: [2023-04-29 11:26:44,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +58: [2023-04-29 11:26:44,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +20: [2023-04-29 11:26:44,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +41: [2023-04-29 11:26:44,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +41: [2023-04-29 11:26:44,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +41: [2023-04-29 11:26:44,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +41: [2023-04-29 11:26:44,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +41: [2023-04-29 11:26:44,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +41: [2023-04-29 11:26:44,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +41: [2023-04-29 11:26:44,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +41: [2023-04-29 11:26:44,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +37: [2023-04-29 11:26:44,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +37: [2023-04-29 11:26:44,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +45: [2023-04-29 11:26:44,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +45: [2023-04-29 11:26:44,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +42: [2023-04-29 11:26:44,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +42: [2023-04-29 11:26:44,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +37: [2023-04-29 11:26:44,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +42: [2023-04-29 11:26:44,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +55: [2023-04-29 11:26:44,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +55: [2023-04-29 11:26:44,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +37: [2023-04-29 11:26:44,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +58: [2023-04-29 11:26:44,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +20: [2023-04-29 11:26:44,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_00-model_states.pt. +42: [2023-04-29 11:26:44,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +55: [2023-04-29 11:26:45,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +55: [2023-04-29 11:26:45,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +33: [2023-04-29 11:26:45,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +41: [2023-04-29 11:26:45,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +41: [2023-04-29 11:26:45,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +41: [2023-04-29 11:26:45,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +33: [2023-04-29 11:26:45,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +41: [2023-04-29 11:26:45,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +41: [2023-04-29 11:26:45,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +46: [2023-04-29 11:26:45,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +46: [2023-04-29 11:26:45,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +35: [2023-04-29 11:26:45,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +41: [2023-04-29 11:26:45,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +10: [2023-04-29 11:26:45,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +10: [2023-04-29 11:26:45,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +33: [2023-04-29 11:26:45,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +35: [2023-04-29 11:26:45,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +35: [2023-04-29 11:26:45,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +37: [2023-04-29 11:26:45,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +37: [2023-04-29 11:26:45,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +41: [2023-04-29 11:26:45,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +37: [2023-04-29 11:26:45,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +35: [2023-04-29 11:26:45,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +42: [2023-04-29 11:26:45,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +42: [2023-04-29 11:26:45,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +41: [2023-04-29 11:26:45,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +57: [2023-04-29 11:26:45,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +46: [2023-04-29 11:26:45,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +46: [2023-04-29 11:26:45,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +34: [2023-04-29 11:26:45,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +34: [2023-04-29 11:26:45,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +42: [2023-04-29 11:26:45,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +37: [2023-04-29 11:26:45,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +57: [2023-04-29 11:26:45,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +42: [2023-04-29 11:26:45,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +45: [2023-04-29 11:26:45,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +57: [2023-04-29 11:26:45,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +56: [2023-04-29 11:26:45,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +42: [2023-04-29 11:26:45,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +20: [2023-04-29 11:26:45,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +42: [2023-04-29 11:26:45,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +44: [2023-04-29 11:26:45,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +44: [2023-04-29 11:26:45,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +44: [2023-04-29 11:26:45,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +63: [2023-04-29 11:26:45,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +63: [2023-04-29 11:26:45,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +62: [2023-04-29 11:26:45,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +46: [2023-04-29 11:26:45,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 11:26:45,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +59: [2023-04-29 11:26:45,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +46: [2023-04-29 11:26:45,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +46: [2023-04-29 11:26:45,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +62: [2023-04-29 11:26:45,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +59: [2023-04-29 11:26:45,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +59: [2023-04-29 11:26:45,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +62: [2023-04-29 11:26:45,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +57: [2023-04-29 11:26:45,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +62: [2023-04-29 11:26:45,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +46: [2023-04-29 11:26:45,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +20: [2023-04-29 11:26:45,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +42: [2023-04-29 11:26:45,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +56: [2023-04-29 11:26:45,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +47: [2023-04-29 11:26:45,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 11:26:45,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +63: [2023-04-29 11:26:45,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +63: [2023-04-29 11:26:45,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +42: [2023-04-29 11:26:45,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +44: [2023-04-29 11:26:45,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +44: [2023-04-29 11:26:45,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +45: [2023-04-29 11:26:45,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +59: [2023-04-29 11:26:45,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +46: [2023-04-29 11:26:45,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +47: [2023-04-29 11:26:45,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +46: [2023-04-29 11:26:45,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +27: [2023-04-29 11:26:45,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +27: [2023-04-29 11:26:45,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +27: [2023-04-29 11:26:45,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +27: [2023-04-29 11:26:45,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +47: [2023-04-29 11:26:45,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 11:26:45,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +44: [2023-04-29 11:26:45,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +46: [2023-04-29 11:26:45,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +47: [2023-04-29 11:26:45,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... + 0: [2023-04-29 11:26:45,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +46: [2023-04-29 11:26:45,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +45: [2023-04-29 11:26:45,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +52: [2023-04-29 11:26:45,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +20: [2023-04-29 11:26:45,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +47: [2023-04-29 11:26:45,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +47: [2023-04-29 11:26:45,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 11:26:45,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 11:26:45,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 11:26:45,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +45: [2023-04-29 11:26:45,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +42: [2023-04-29 11:26:45,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +20: [2023-04-29 11:26:45,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 7: [2023-04-29 11:26:45,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +47: [2023-04-29 11:26:45,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +38: [2023-04-29 11:26:45,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +55: [2023-04-29 11:26:45,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +52: [2023-04-29 11:26:45,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 7: [2023-04-29 11:26:45,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +55: [2023-04-29 11:26:45,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +52: [2023-04-29 11:26:45,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +58: [2023-04-29 11:26:45,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +42: [2023-04-29 11:26:45,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +46: [2023-04-29 11:26:45,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +33: [2023-04-29 11:26:45,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 7: [2023-04-29 11:26:45,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +47: [2023-04-29 11:26:45,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 7: [2023-04-29 11:26:45,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +33: [2023-04-29 11:26:45,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +42: [2023-04-29 11:26:45,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +42: [2023-04-29 11:26:45,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +48: [2023-04-29 11:26:45,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +44: [2023-04-29 11:26:45,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +48: [2023-04-29 11:26:45,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 7: [2023-04-29 11:26:45,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +46: [2023-04-29 11:26:45,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +46: [2023-04-29 11:26:45,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +52: [2023-04-29 11:26:45,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +46: [2023-04-29 11:26:45,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +18: [2023-04-29 11:26:45,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +18: [2023-04-29 11:26:45,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +18: [2023-04-29 11:26:45,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +37: [2023-04-29 11:26:45,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +18: [2023-04-29 11:26:45,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +37: [2023-04-29 11:26:45,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +40: [2023-04-29 11:26:45,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +37: [2023-04-29 11:26:45,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +55: [2023-04-29 11:26:45,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +44: [2023-04-29 11:26:45,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +55: [2023-04-29 11:26:45,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +34: [2023-04-29 11:26:45,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +47: [2023-04-29 11:26:45,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +37: [2023-04-29 11:26:45,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +18: [2023-04-29 11:26:45,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +36: [2023-04-29 11:26:45,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +36: [2023-04-29 11:26:45,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +36: [2023-04-29 11:26:45,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +58: [2023-04-29 11:26:45,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +58: [2023-04-29 11:26:45,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +37: [2023-04-29 11:26:45,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +36: [2023-04-29 11:26:45,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +38: [2023-04-29 11:26:45,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +38: [2023-04-29 11:26:45,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +40: [2023-04-29 11:26:45,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +40: [2023-04-29 11:26:45,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +59: [2023-04-29 11:26:45,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +59: [2023-04-29 11:26:45,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +59: [2023-04-29 11:26:45,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +59: [2023-04-29 11:26:45,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +40: [2023-04-29 11:26:45,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +40: [2023-04-29 11:26:45,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +47: [2023-04-29 11:26:45,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +47: [2023-04-29 11:26:45,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +47: [2023-04-29 11:26:45,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +40: [2023-04-29 11:26:45,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +38: [2023-04-29 11:26:45,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +40: [2023-04-29 11:26:45,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +40: [2023-04-29 11:26:45,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. + 0: [2023-04-29 11:26:45,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +63: [2023-04-29 11:26:45,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +63: [2023-04-29 11:26:45,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +37: [2023-04-29 11:26:45,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +17: [2023-04-29 11:26:45,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +17: [2023-04-29 11:26:45,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +17: [2023-04-29 11:26:45,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +17: [2023-04-29 11:26:45,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +63: [2023-04-29 11:26:45,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +37: [2023-04-29 11:26:45,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +18: [2023-04-29 11:26:45,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +58: [2023-04-29 11:26:45,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +44: [2023-04-29 11:26:45,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +44: [2023-04-29 11:26:45,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +59: [2023-04-29 11:26:45,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +44: [2023-04-29 11:26:45,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +47: [2023-04-29 11:26:45,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +50: [2023-04-29 11:26:45,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +50: [2023-04-29 11:26:45,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +44: [2023-04-29 11:26:45,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +63: [2023-04-29 11:26:45,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +59: [2023-04-29 11:26:45,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +17: [2023-04-29 11:26:45,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +17: [2023-04-29 11:26:45,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +18: [2023-04-29 11:26:45,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +44: [2023-04-29 11:26:45,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +18: [2023-04-29 11:26:45,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +50: [2023-04-29 11:26:45,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +44: [2023-04-29 11:26:45,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +59: [2023-04-29 11:26:45,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +50: [2023-04-29 11:26:45,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +17: [2023-04-29 11:26:45,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +52: [2023-04-29 11:26:45,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +34: [2023-04-29 11:26:45,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +17: [2023-04-29 11:26:45,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +59: [2023-04-29 11:26:45,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 6: [2023-04-29 11:26:45,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +57: [2023-04-29 11:26:45,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +57: [2023-04-29 11:26:45,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +38: [2023-04-29 11:26:45,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +48: [2023-04-29 11:26:45,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +52: [2023-04-29 11:26:45,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +35: [2023-04-29 11:26:45,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +35: [2023-04-29 11:26:45,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +50: [2023-04-29 11:26:45,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +33: [2023-04-29 11:26:45,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +39: [2023-04-29 11:26:45,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +39: [2023-04-29 11:26:45,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +27: [2023-04-29 11:26:45,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +39: [2023-04-29 11:26:45,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +34: [2023-04-29 11:26:45,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +34: [2023-04-29 11:26:45,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +39: [2023-04-29 11:26:45,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +57: [2023-04-29 11:26:45,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +57: [2023-04-29 11:26:45,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 6: [2023-04-29 11:26:45,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +52: [2023-04-29 11:26:45,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +50: [2023-04-29 11:26:45,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +27: [2023-04-29 11:26:45,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +57: [2023-04-29 11:26:45,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +27: [2023-04-29 11:26:45,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +50: [2023-04-29 11:26:45,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +40: [2023-04-29 11:26:45,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +48: [2023-04-29 11:26:45,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +57: [2023-04-29 11:26:45,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +35: [2023-04-29 11:26:45,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +52: [2023-04-29 11:26:45,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +50: [2023-04-29 11:26:45,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +34: [2023-04-29 11:26:45,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +50: [2023-04-29 11:26:45,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +50: [2023-04-29 11:26:45,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +48: [2023-04-29 11:26:45,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +48: [2023-04-29 11:26:45,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 7: [2023-04-29 11:26:45,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +27: [2023-04-29 11:26:45,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +57: [2023-04-29 11:26:45,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +34: [2023-04-29 11:26:45,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +58: [2023-04-29 11:26:45,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +44: [2023-04-29 11:26:45,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +57: [2023-04-29 11:26:45,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +35: [2023-04-29 11:26:45,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +41: [2023-04-29 11:26:45,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +50: [2023-04-29 11:26:45,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... + 0: [2023-04-29 11:26:45,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +18: [2023-04-29 11:26:45,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +50: [2023-04-29 11:26:45,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +34: [2023-04-29 11:26:45,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +18: [2023-04-29 11:26:45,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +18: [2023-04-29 11:26:45,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +18: [2023-04-29 11:26:45,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +18: [2023-04-29 11:26:45,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +44: [2023-04-29 11:26:45,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +45: [2023-04-29 11:26:45,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +45: [2023-04-29 11:26:45,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +45: [2023-04-29 11:26:45,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +36: [2023-04-29 11:26:45,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +36: [2023-04-29 11:26:45,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +38: [2023-04-29 11:26:45,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +38: [2023-04-29 11:26:45,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +45: [2023-04-29 11:26:45,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +34: [2023-04-29 11:26:45,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +47: [2023-04-29 11:26:45,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +36: [2023-04-29 11:26:45,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +38: [2023-04-29 11:26:45,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +41: [2023-04-29 11:26:45,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +58: [2023-04-29 11:26:45,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +58: [2023-04-29 11:26:45,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +41: [2023-04-29 11:26:45,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +41: [2023-04-29 11:26:45,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +36: [2023-04-29 11:26:45,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +15: [2023-04-29 11:26:45,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +15: [2023-04-29 11:26:45,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 8: [2023-04-29 11:26:45,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +15: [2023-04-29 11:26:45,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +15: [2023-04-29 11:26:45,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +60: [2023-04-29 11:26:45,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. + 8: [2023-04-29 11:26:45,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +60: [2023-04-29 11:26:45,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +60: [2023-04-29 11:26:45,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +12: [2023-04-29 11:26:45,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +12: [2023-04-29 11:26:45,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +12: [2023-04-29 11:26:45,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +60: [2023-04-29 11:26:45,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +40: [2023-04-29 11:26:45,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +12: [2023-04-29 11:26:45,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +47: [2023-04-29 11:26:45,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +47: [2023-04-29 11:26:45,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +40: [2023-04-29 11:26:45,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +40: [2023-04-29 11:26:45,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +34: [2023-04-29 11:26:45,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +18: [2023-04-29 11:26:45,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +40: [2023-04-29 11:26:45,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +40: [2023-04-29 11:26:45,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +15: [2023-04-29 11:26:45,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +12: [2023-04-29 11:26:45,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +40: [2023-04-29 11:26:45,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +15: [2023-04-29 11:26:45,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +15: [2023-04-29 11:26:45,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +15: [2023-04-29 11:26:45,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 11:26:45,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +29: [2023-04-29 11:26:45,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +29: [2023-04-29 11:26:45,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +12: [2023-04-29 11:26:45,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +16: [2023-04-29 11:26:45,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +12: [2023-04-29 11:26:45,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +16: [2023-04-29 11:26:45,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +16: [2023-04-29 11:26:45,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +16: [2023-04-29 11:26:45,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +29: [2023-04-29 11:26:45,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +12: [2023-04-29 11:26:45,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +13: [2023-04-29 11:26:45,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +13: [2023-04-29 11:26:45,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +13: [2023-04-29 11:26:45,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +40: [2023-04-29 11:26:45,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +13: [2023-04-29 11:26:45,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +58: [2023-04-29 11:26:45,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +59: [2023-04-29 11:26:45,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +57: [2023-04-29 11:26:45,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +35: [2023-04-29 11:26:45,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +50: [2023-04-29 11:26:45,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +18: [2023-04-29 11:26:45,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +29: [2023-04-29 11:26:45,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 11:26:45,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 11:26:45,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 11:26:45,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +39: [2023-04-29 11:26:45,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +39: [2023-04-29 11:26:45,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +16: [2023-04-29 11:26:45,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +16: [2023-04-29 11:26:45,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +35: [2023-04-29 11:26:45,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +35: [2023-04-29 11:26:45,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +18: [2023-04-29 11:26:45,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +50: [2023-04-29 11:26:45,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +35: [2023-04-29 11:26:45,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +50: [2023-04-29 11:26:45,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +59: [2023-04-29 11:26:45,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +59: [2023-04-29 11:26:45,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +46: [2023-04-29 11:26:45,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +46: [2023-04-29 11:26:45,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +34: [2023-04-29 11:26:45,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +59: [2023-04-29 11:26:45,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +35: [2023-04-29 11:26:45,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +13: [2023-04-29 11:26:45,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +13: [2023-04-29 11:26:45,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +16: [2023-04-29 11:26:45,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +16: [2023-04-29 11:26:45,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +13: [2023-04-29 11:26:45,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +13: [2023-04-29 11:26:45,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +39: [2023-04-29 11:26:45,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +57: [2023-04-29 11:26:45,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +39: [2023-04-29 11:26:45,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +42: [2023-04-29 11:26:45,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 1: [2023-04-29 11:26:45,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 1: [2023-04-29 11:26:45,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 1: [2023-04-29 11:26:45,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 1: [2023-04-29 11:26:45,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +57: [2023-04-29 11:26:45,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +50: [2023-04-29 11:26:45,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +46: [2023-04-29 11:26:45,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +46: [2023-04-29 11:26:45,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +57: [2023-04-29 11:26:45,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +59: [2023-04-29 11:26:45,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +59: [2023-04-29 11:26:45,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +23: [2023-04-29 11:26:45,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +23: [2023-04-29 11:26:45,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +34: [2023-04-29 11:26:45,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +34: [2023-04-29 11:26:45,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +42: [2023-04-29 11:26:45,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +35: [2023-04-29 11:26:45,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +42: [2023-04-29 11:26:45,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +35: [2023-04-29 11:26:45,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +35: [2023-04-29 11:26:45,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +35: [2023-04-29 11:26:45,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... + 0: [2023-04-29 11:26:45,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +35: [2023-04-29 11:26:45,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... + 1: [2023-04-29 11:26:45,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +35: [2023-04-29 11:26:45,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +55: [2023-04-29 11:26:45,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +41: [2023-04-29 11:26:45,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +23: [2023-04-29 11:26:45,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +45: [2023-04-29 11:26:45,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +23: [2023-04-29 11:26:45,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +57: [2023-04-29 11:26:45,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +57: [2023-04-29 11:26:45,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +57: [2023-04-29 11:26:45,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +55: [2023-04-29 11:26:45,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +45: [2023-04-29 11:26:45,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +23: [2023-04-29 11:26:45,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +23: [2023-04-29 11:26:45,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +37: [2023-04-29 11:26:45,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +60: [2023-04-29 11:26:45,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +60: [2023-04-29 11:26:45,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +35: [2023-04-29 11:26:45,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +55: [2023-04-29 11:26:45,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... + 7: [2023-04-29 11:26:45,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +45: [2023-04-29 11:26:45,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +45: [2023-04-29 11:26:45,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +57: [2023-04-29 11:26:45,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +23: [2023-04-29 11:26:45,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +34: [2023-04-29 11:26:45,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +60: [2023-04-29 11:26:45,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +41: [2023-04-29 11:26:45,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +41: [2023-04-29 11:26:45,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +55: [2023-04-29 11:26:45,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +23: [2023-04-29 11:26:45,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +41: [2023-04-29 11:26:45,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +55: [2023-04-29 11:26:45,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +42: [2023-04-29 11:26:45,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +42: [2023-04-29 11:26:45,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +42: [2023-04-29 11:26:45,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +42: [2023-04-29 11:26:45,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +59: [2023-04-29 11:26:45,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +37: [2023-04-29 11:26:45,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +46: [2023-04-29 11:26:45,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +63: [2023-04-29 11:26:45,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +34: [2023-04-29 11:26:45,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +60: [2023-04-29 11:26:45,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +55: [2023-04-29 11:26:45,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +46: [2023-04-29 11:26:45,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +46: [2023-04-29 11:26:45,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +46: [2023-04-29 11:26:45,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +46: [2023-04-29 11:26:45,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +17: [2023-04-29 11:26:45,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +63: [2023-04-29 11:26:45,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +63: [2023-04-29 11:26:45,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +34: [2023-04-29 11:26:45,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +12: [2023-04-29 11:26:45,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +12: [2023-04-29 11:26:45,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +12: [2023-04-29 11:26:45,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +17: [2023-04-29 11:26:45,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +63: [2023-04-29 11:26:45,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +37: [2023-04-29 11:26:45,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +37: [2023-04-29 11:26:45,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +44: [2023-04-29 11:26:45,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +12: [2023-04-29 11:26:45,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 0: [2023-04-29 11:26:45,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +42: [2023-04-29 11:26:45,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +42: [2023-04-29 11:26:45,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +42: [2023-04-29 11:26:45,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +54: [2023-04-29 11:26:45,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +54: [2023-04-29 11:26:45,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +54: [2023-04-29 11:26:45,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +54: [2023-04-29 11:26:45,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +19: [2023-04-29 11:26:45,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +19: [2023-04-29 11:26:45,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +19: [2023-04-29 11:26:45,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +59: [2023-04-29 11:26:45,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +19: [2023-04-29 11:26:45,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +55: [2023-04-29 11:26:45,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +37: [2023-04-29 11:26:45,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +10: [2023-04-29 11:26:45,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +34: [2023-04-29 11:26:45,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +10: [2023-04-29 11:26:45,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +10: [2023-04-29 11:26:45,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +10: [2023-04-29 11:26:45,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +46: [2023-04-29 11:26:45,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +46: [2023-04-29 11:26:45,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +44: [2023-04-29 11:26:45,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +63: [2023-04-29 11:26:45,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +46: [2023-04-29 11:26:45,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +49: [2023-04-29 11:26:45,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +49: [2023-04-29 11:26:45,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +63: [2023-04-29 11:26:45,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +46: [2023-04-29 11:26:45,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... + 0: [2023-04-29 11:26:45,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +46: [2023-04-29 11:26:45,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +44: [2023-04-29 11:26:45,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +59: [2023-04-29 11:26:45,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +37: [2023-04-29 11:26:45,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +42: [2023-04-29 11:26:45,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +37: [2023-04-29 11:26:45,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +44: [2023-04-29 11:26:45,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +63: [2023-04-29 11:26:45,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 11:26:45,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +57: [2023-04-29 11:26:45,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +17: [2023-04-29 11:26:45,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +55: [2023-04-29 11:26:45,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +42: [2023-04-29 11:26:45,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +44: [2023-04-29 11:26:45,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +37: [2023-04-29 11:26:45,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +44: [2023-04-29 11:26:45,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +49: [2023-04-29 11:26:45,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. +49: [2023-04-29 11:26:45,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_31-model_01-model_states.pt. + 7: [2023-04-29 11:26:45,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +42: [2023-04-29 11:26:45,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +42: [2023-04-29 11:26:45,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +44: [2023-04-29 11:26:45,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +63: [2023-04-29 11:26:45,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +44: [2023-04-29 11:26:45,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... + 7: [2023-04-29 11:26:45,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +42: [2023-04-29 11:26:45,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... + 7: [2023-04-29 11:26:45,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +40: [2023-04-29 11:26:45,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +18: [2023-04-29 11:26:45,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +36: [2023-04-29 11:26:45,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +12: [2023-04-29 11:26:45,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +42: [2023-04-29 11:26:45,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +25: [2023-04-29 11:26:45,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +25: [2023-04-29 11:26:45,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +40: [2023-04-29 11:26:45,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +57: [2023-04-29 11:26:45,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +57: [2023-04-29 11:26:45,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +59: [2023-04-29 11:26:45,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +59: [2023-04-29 11:26:45,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +36: [2023-04-29 11:26:45,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +18: [2023-04-29 11:26:45,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +25: [2023-04-29 11:26:45,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +25: [2023-04-29 11:26:45,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +46: [2023-04-29 11:26:45,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +12: [2023-04-29 11:26:45,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +17: [2023-04-29 11:26:45,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 11:26:45,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +54: [2023-04-29 11:26:45,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +54: [2023-04-29 11:26:45,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +36: [2023-04-29 11:26:45,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +36: [2023-04-29 11:26:45,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +59: [2023-04-29 11:26:45,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +57: [2023-04-29 11:26:45,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +36: [2023-04-29 11:26:45,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +46: [2023-04-29 11:26:45,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +25: [2023-04-29 11:26:45,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +25: [2023-04-29 11:26:45,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 11:26:45,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +12: [2023-04-29 11:26:45,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +25: [2023-04-29 11:26:45,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +54: [2023-04-29 11:26:45,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +54: [2023-04-29 11:26:45,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +19: [2023-04-29 11:26:45,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +36: [2023-04-29 11:26:45,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +25: [2023-04-29 11:26:45,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +19: [2023-04-29 11:26:45,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +10: [2023-04-29 11:26:45,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +12: [2023-04-29 11:26:45,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +36: [2023-04-29 11:26:45,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... + 0: [2023-04-29 11:26:45,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +36: [2023-04-29 11:26:45,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +15: [2023-04-29 11:26:45,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +15: [2023-04-29 11:26:45,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +22: [2023-04-29 11:26:45,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +22: [2023-04-29 11:26:45,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +18: [2023-04-29 11:26:45,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +18: [2023-04-29 11:26:45,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +19: [2023-04-29 11:26:45,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +59: [2023-04-29 11:26:45,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +15: [2023-04-29 11:26:45,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +15: [2023-04-29 11:26:45,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +12: [2023-04-29 11:26:45,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +49: [2023-04-29 11:26:45,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +15: [2023-04-29 11:26:45,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +19: [2023-04-29 11:26:45,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +49: [2023-04-29 11:26:45,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +16: [2023-04-29 11:26:45,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +15: [2023-04-29 11:26:45,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +10: [2023-04-29 11:26:45,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +10: [2023-04-29 11:26:45,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +18: [2023-04-29 11:26:45,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +15: [2023-04-29 11:26:45,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +15: [2023-04-29 11:26:45,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +57: [2023-04-29 11:26:45,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +22: [2023-04-29 11:26:45,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +13: [2023-04-29 11:26:45,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +22: [2023-04-29 11:26:45,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +40: [2023-04-29 11:26:45,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +39: [2023-04-29 11:26:45,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +49: [2023-04-29 11:26:45,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +17: [2023-04-29 11:26:45,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +16: [2023-04-29 11:26:45,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +17: [2023-04-29 11:26:45,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +10: [2023-04-29 11:26:45,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 7: [2023-04-29 11:26:45,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +24: [2023-04-29 11:26:45,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +24: [2023-04-29 11:26:45,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +24: [2023-04-29 11:26:45,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +29: [2023-04-29 11:26:45,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +24: [2023-04-29 11:26:45,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +22: [2023-04-29 11:26:45,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +40: [2023-04-29 11:26:45,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +40: [2023-04-29 11:26:45,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +39: [2023-04-29 11:26:45,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +18: [2023-04-29 11:26:45,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +18: [2023-04-29 11:26:45,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +18: [2023-04-29 11:26:45,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +29: [2023-04-29 11:26:45,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +29: [2023-04-29 11:26:45,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +51: [2023-04-29 11:26:45,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +51: [2023-04-29 11:26:45,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +51: [2023-04-29 11:26:45,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +51: [2023-04-29 11:26:45,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +22: [2023-04-29 11:26:45,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +40: [2023-04-29 11:26:45,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +22: [2023-04-29 11:26:45,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 5: [2023-04-29 11:26:45,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +39: [2023-04-29 11:26:45,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... + 5: [2023-04-29 11:26:45,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +49: [2023-04-29 11:26:45,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 5: [2023-04-29 11:26:45,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 5: [2023-04-29 11:26:45,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +24: [2023-04-29 11:26:45,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +12: [2023-04-29 11:26:45,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +24: [2023-04-29 11:26:45,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +24: [2023-04-29 11:26:45,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +24: [2023-04-29 11:26:45,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +39: [2023-04-29 11:26:45,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... + 7: [2023-04-29 11:26:45,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +22: [2023-04-29 11:26:45,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +13: [2023-04-29 11:26:45,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +13: [2023-04-29 11:26:45,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +13: [2023-04-29 11:26:45,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +40: [2023-04-29 11:26:45,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +39: [2023-04-29 11:26:45,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +40: [2023-04-29 11:26:45,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +45: [2023-04-29 11:26:45,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +61: [2023-04-29 11:26:45,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +61: [2023-04-29 11:26:45,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +61: [2023-04-29 11:26:45,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +61: [2023-04-29 11:26:45,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. + 5: [2023-04-29 11:26:45,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 5: [2023-04-29 11:26:45,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 5: [2023-04-29 11:26:45,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +43: [2023-04-29 11:26:45,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +43: [2023-04-29 11:26:45,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +43: [2023-04-29 11:26:45,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +43: [2023-04-29 11:26:45,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +16: [2023-04-29 11:26:45,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +16: [2023-04-29 11:26:45,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 5: [2023-04-29 11:26:45,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +45: [2023-04-29 11:26:45,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +12: [2023-04-29 11:26:45,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +12: [2023-04-29 11:26:45,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +39: [2023-04-29 11:26:45,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +57: [2023-04-29 11:26:45,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +56: [2023-04-29 11:26:45,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 11:26:45,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +45: [2023-04-29 11:26:45,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +45: [2023-04-29 11:26:45,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +39: [2023-04-29 11:26:45,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... + 1: [2023-04-29 11:26:45,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 1: [2023-04-29 11:26:45,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +57: [2023-04-29 11:26:45,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +23: [2023-04-29 11:26:45,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +23: [2023-04-29 11:26:45,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +23: [2023-04-29 11:26:45,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +29: [2023-04-29 11:26:45,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +12: [2023-04-29 11:26:45,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +59: [2023-04-29 11:26:45,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +59: [2023-04-29 11:26:45,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +45: [2023-04-29 11:26:45,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +16: [2023-04-29 11:26:45,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +39: [2023-04-29 11:26:45,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +56: [2023-04-29 11:26:45,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 11:26:45,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +57: [2023-04-29 11:26:45,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 7: [2023-04-29 11:26:45,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +56: [2023-04-29 11:26:45,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 11:26:45,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 11:26:45,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 11:26:45,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +45: [2023-04-29 11:26:45,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +45: [2023-04-29 11:26:45,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 3: [2023-04-29 11:26:45,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 3: [2023-04-29 11:26:45,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 3: [2023-04-29 11:26:45,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +59: [2023-04-29 11:26:45,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 3: [2023-04-29 11:26:45,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +56: [2023-04-29 11:26:45,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +56: [2023-04-29 11:26:45,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... + 8: [2023-04-29 11:26:45,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +23: [2023-04-29 11:26:45,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +56: [2023-04-29 11:26:45,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +56: [2023-04-29 11:26:45,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... + 3: [2023-04-29 11:26:45,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 3: [2023-04-29 11:26:45,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +56: [2023-04-29 11:26:45,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +32: [2023-04-29 11:26:45,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +32: [2023-04-29 11:26:45,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +32: [2023-04-29 11:26:45,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. + 3: [2023-04-29 11:26:45,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +32: [2023-04-29 11:26:45,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +45: [2023-04-29 11:26:45,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +29: [2023-04-29 11:26:45,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +16: [2023-04-29 11:26:45,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +15: [2023-04-29 11:26:45,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +56: [2023-04-29 11:26:45,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +56: [2023-04-29 11:26:45,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... + 3: [2023-04-29 11:26:45,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +56: [2023-04-29 11:26:45,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +15: [2023-04-29 11:26:45,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +51: [2023-04-29 11:26:45,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +51: [2023-04-29 11:26:45,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 7: [2023-04-29 11:26:45,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +26: [2023-04-29 11:26:45,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +26: [2023-04-29 11:26:45,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +15: [2023-04-29 11:26:45,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +15: [2023-04-29 11:26:45,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +26: [2023-04-29 11:26:45,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +26: [2023-04-29 11:26:45,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +51: [2023-04-29 11:26:45,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +29: [2023-04-29 11:26:45,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +51: [2023-04-29 11:26:45,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +29: [2023-04-29 11:26:45,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +14: [2023-04-29 11:26:45,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +14: [2023-04-29 11:26:45,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +15: [2023-04-29 11:26:45,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +15: [2023-04-29 11:26:45,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +15: [2023-04-29 11:26:45,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +15: [2023-04-29 11:26:45,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +26: [2023-04-29 11:26:45,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +13: [2023-04-29 11:26:45,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +12: [2023-04-29 11:26:45,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +28: [2023-04-29 11:26:45,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +28: [2023-04-29 11:26:45,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +28: [2023-04-29 11:26:45,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +28: [2023-04-29 11:26:45,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +61: [2023-04-29 11:26:45,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +61: [2023-04-29 11:26:45,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +14: [2023-04-29 11:26:45,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +43: [2023-04-29 11:26:45,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +26: [2023-04-29 11:26:45,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +14: [2023-04-29 11:26:45,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +26: [2023-04-29 11:26:45,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +26: [2023-04-29 11:26:45,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +61: [2023-04-29 11:26:45,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +61: [2023-04-29 11:26:45,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 11:26:45,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 11:26:45,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +14: [2023-04-29 11:26:45,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +23: [2023-04-29 11:26:45,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +28: [2023-04-29 11:26:45,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 11:26:45,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 11:26:45,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +14: [2023-04-29 11:26:45,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +43: [2023-04-29 11:26:45,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +14: [2023-04-29 11:26:45,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +13: [2023-04-29 11:26:45,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +13: [2023-04-29 11:26:45,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +12: [2023-04-29 11:26:45,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +12: [2023-04-29 11:26:45,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +23: [2023-04-29 11:26:45,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +28: [2023-04-29 11:26:45,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +23: [2023-04-29 11:26:45,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +14: [2023-04-29 11:26:45,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +49: [2023-04-29 11:26:45,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +49: [2023-04-29 11:26:45,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +13: [2023-04-29 11:26:45,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +30: [2023-04-29 11:26:45,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +30: [2023-04-29 11:26:45,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +30: [2023-04-29 11:26:45,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +12: [2023-04-29 11:26:45,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +30: [2023-04-29 11:26:45,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +49: [2023-04-29 11:26:45,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +49: [2023-04-29 11:26:45,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +49: [2023-04-29 11:26:45,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +49: [2023-04-29 11:26:45,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +19: [2023-04-29 11:26:45,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +25: [2023-04-29 11:26:45,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +12: [2023-04-29 11:26:45,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +30: [2023-04-29 11:26:45,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +32: [2023-04-29 11:26:45,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +30: [2023-04-29 11:26:45,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +12: [2023-04-29 11:26:45,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +23: [2023-04-29 11:26:45,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +30: [2023-04-29 11:26:45,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +32: [2023-04-29 11:26:45,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +30: [2023-04-29 11:26:45,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +16: [2023-04-29 11:26:45,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +16: [2023-04-29 11:26:45,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +10: [2023-04-29 11:26:45,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 1: [2023-04-29 11:26:45,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +32: [2023-04-29 11:26:45,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +25: [2023-04-29 11:26:45,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +25: [2023-04-29 11:26:45,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +25: [2023-04-29 11:26:45,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +19: [2023-04-29 11:26:45,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +12: [2023-04-29 11:26:45,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +49: [2023-04-29 11:26:45,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +49: [2023-04-29 11:26:45,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt... +32: [2023-04-29 11:26:45,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +53: [2023-04-29 11:26:45,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +53: [2023-04-29 11:26:45,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +53: [2023-04-29 11:26:45,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +53: [2023-04-29 11:26:45,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +19: [2023-04-29 11:26:45,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +22: [2023-04-29 11:26:45,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +10: [2023-04-29 11:26:45,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +21: [2023-04-29 11:26:45,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 11:26:45,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 11:26:45,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +19: [2023-04-29 11:26:45,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +21: [2023-04-29 11:26:45,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +49: [2023-04-29 11:26:45,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +49: [2023-04-29 11:26:45,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +19: [2023-04-29 11:26:45,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +19: [2023-04-29 11:26:45,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +10: [2023-04-29 11:26:45,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +10: [2023-04-29 11:26:45,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +10: [2023-04-29 11:26:45,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +21: [2023-04-29 11:26:45,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +49: [2023-04-29 11:26:45,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +22: [2023-04-29 11:26:45,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +21: [2023-04-29 11:26:45,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +21: [2023-04-29 11:26:45,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 5: [2023-04-29 11:26:45,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 5: [2023-04-29 11:26:45,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +21: [2023-04-29 11:26:45,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +24: [2023-04-29 11:26:45,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +49: [2023-04-29 11:26:45,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +49: [2023-04-29 11:26:45,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +19: [2023-04-29 11:26:45,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 9: [2023-04-29 11:26:45,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 9: [2023-04-29 11:26:45,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 9: [2023-04-29 11:26:45,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 9: [2023-04-29 11:26:45,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +19: [2023-04-29 11:26:45,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 2: [2023-04-29 11:26:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 2: [2023-04-29 11:26:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 2: [2023-04-29 11:26:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +24: [2023-04-29 11:26:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 2: [2023-04-29 11:26:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +26: [2023-04-29 11:26:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +26: [2023-04-29 11:26:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +26: [2023-04-29 11:26:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 9: [2023-04-29 11:26:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +26: [2023-04-29 11:26:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +10: [2023-04-29 11:26:45,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +10: [2023-04-29 11:26:45,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +24: [2023-04-29 11:26:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +24: [2023-04-29 11:26:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +12: [2023-04-29 11:26:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +12: [2023-04-29 11:26:45,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +16: [2023-04-29 11:26:45,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +16: [2023-04-29 11:26:45,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +10: [2023-04-29 11:26:45,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +16: [2023-04-29 11:26:45,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +49: [2023-04-29 11:26:45,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +24: [2023-04-29 11:26:45,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +24: [2023-04-29 11:26:45,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +24: [2023-04-29 11:26:45,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +22: [2023-04-29 11:26:45,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +16: [2023-04-29 11:26:45,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 5: [2023-04-29 11:26:45,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 5: [2023-04-29 11:26:45,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +24: [2023-04-29 11:26:45,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +52: [2023-04-29 11:26:45,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +52: [2023-04-29 11:26:45,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +52: [2023-04-29 11:26:45,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +52: [2023-04-29 11:26:45,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +25: [2023-04-29 11:26:45,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 3: [2023-04-29 11:26:45,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +56: [2023-04-29 11:26:45,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +12: [2023-04-29 11:26:45,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +12: [2023-04-29 11:26:45,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +36: [2023-04-29 11:26:45,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +36: [2023-04-29 11:26:45,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +36: [2023-04-29 11:26:45,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +36: [2023-04-29 11:26:45,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +25: [2023-04-29 11:26:45,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +51: [2023-04-29 11:26:45,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +51: [2023-04-29 11:26:45,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +51: [2023-04-29 11:26:45,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +51: [2023-04-29 11:26:45,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +22: [2023-04-29 11:26:45,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +25: [2023-04-29 11:26:45,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +25: [2023-04-29 11:26:45,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +49: [2023-04-29 11:26:45,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +53: [2023-04-29 11:26:45,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 3: [2023-04-29 11:26:45,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +56: [2023-04-29 11:26:45,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +43: [2023-04-29 11:26:45,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +43: [2023-04-29 11:26:45,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +15: [2023-04-29 11:26:45,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +53: [2023-04-29 11:26:45,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +53: [2023-04-29 11:26:45,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +22: [2023-04-29 11:26:45,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +53: [2023-04-29 11:26:45,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +56: [2023-04-29 11:26:45,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +51: [2023-04-29 11:26:45,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +51: [2023-04-29 11:26:45,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +36: [2023-04-29 11:26:45,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +51: [2023-04-29 11:26:45,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +51: [2023-04-29 11:26:45,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +36: [2023-04-29 11:26:45,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 11:26:45,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +43: [2023-04-29 11:26:45,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +36: [2023-04-29 11:26:45,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 11:26:45,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +36: [2023-04-29 11:26:45,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +56: [2023-04-29 11:26:45,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 3: [2023-04-29 11:26:45,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 3: [2023-04-29 11:26:45,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +43: [2023-04-29 11:26:45,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +15: [2023-04-29 11:26:45,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +51: [2023-04-29 11:26:45,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +49: [2023-04-29 11:26:45,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt... +43: [2023-04-29 11:26:45,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 11:26:45,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 11:26:45,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +22: [2023-04-29 11:26:45,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +24: [2023-04-29 11:26:45,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +51: [2023-04-29 11:26:45,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... + 4: [2023-04-29 11:26:45,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 11:26:45,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 5: [2023-04-29 11:26:45,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 5: [2023-04-29 11:26:45,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +51: [2023-04-29 11:26:45,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +26: [2023-04-29 11:26:45,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +51: [2023-04-29 11:26:45,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +24: [2023-04-29 11:26:45,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +31: [2023-04-29 11:26:45,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +31: [2023-04-29 11:26:45,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +31: [2023-04-29 11:26:45,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +43: [2023-04-29 11:26:45,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +31: [2023-04-29 11:26:45,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +15: [2023-04-29 11:26:45,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 4: [2023-04-29 11:26:45,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +14: [2023-04-29 11:26:45,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +33: [2023-04-29 11:26:45,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +33: [2023-04-29 11:26:45,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +33: [2023-04-29 11:26:45,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +15: [2023-04-29 11:26:45,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +33: [2023-04-29 11:26:45,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +51: [2023-04-29 11:26:45,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +51: [2023-04-29 11:26:45,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +28: [2023-04-29 11:26:45,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +28: [2023-04-29 11:26:45,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +16: [2023-04-29 11:26:45,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 11:26:45,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +51: [2023-04-29 11:26:45,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +20: [2023-04-29 11:26:45,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +20: [2023-04-29 11:26:45,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +52: [2023-04-29 11:26:45,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +31: [2023-04-29 11:26:45,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +31: [2023-04-29 11:26:45,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +31: [2023-04-29 11:26:45,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +19: [2023-04-29 11:26:45,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +19: [2023-04-29 11:26:45,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +31: [2023-04-29 11:26:45,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +19: [2023-04-29 11:26:45,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +19: [2023-04-29 11:26:45,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 3: [2023-04-29 11:26:45,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +20: [2023-04-29 11:26:45,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 11:26:45,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +14: [2023-04-29 11:26:45,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +14: [2023-04-29 11:26:45,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 2: [2023-04-29 11:26:45,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +43: [2023-04-29 11:26:45,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +15: [2023-04-29 11:26:45,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +52: [2023-04-29 11:26:45,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +26: [2023-04-29 11:26:45,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +20: [2023-04-29 11:26:45,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +56: [2023-04-29 11:26:45,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +24: [2023-04-29 11:26:45,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +52: [2023-04-29 11:26:45,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 5: [2023-04-29 11:26:45,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +22: [2023-04-29 11:26:45,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 5: [2023-04-29 11:26:45,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +15: [2023-04-29 11:26:45,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +26: [2023-04-29 11:26:45,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +26: [2023-04-29 11:26:45,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +26: [2023-04-29 11:26:45,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +28: [2023-04-29 11:26:45,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +20: [2023-04-29 11:26:45,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +26: [2023-04-29 11:26:45,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +24: [2023-04-29 11:26:45,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +56: [2023-04-29 11:26:45,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +51: [2023-04-29 11:26:45,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +26: [2023-04-29 11:26:45,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +20: [2023-04-29 11:26:45,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +19: [2023-04-29 11:26:45,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +16: [2023-04-29 11:26:45,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +19: [2023-04-29 11:26:45,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +19: [2023-04-29 11:26:45,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +52: [2023-04-29 11:26:45,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +20: [2023-04-29 11:26:45,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +16: [2023-04-29 11:26:45,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +16: [2023-04-29 11:26:45,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +24: [2023-04-29 11:26:45,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +19: [2023-04-29 11:26:45,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +15: [2023-04-29 11:26:45,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +24: [2023-04-29 11:26:45,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +43: [2023-04-29 11:26:45,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +43: [2023-04-29 11:26:45,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +24: [2023-04-29 11:26:45,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +24: [2023-04-29 11:26:45,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +49: [2023-04-29 11:26:45,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. + 3: [2023-04-29 11:26:45,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +14: [2023-04-29 11:26:45,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +49: [2023-04-29 11:26:45,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +56: [2023-04-29 11:26:45,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 11:26:45,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +22: [2023-04-29 11:26:45,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +43: [2023-04-29 11:26:45,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +56: [2023-04-29 11:26:45,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 11:26:45,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +30: [2023-04-29 11:26:45,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 3: [2023-04-29 11:26:45,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +39: [2023-04-29 11:26:45,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +39: [2023-04-29 11:26:45,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 11:26:45,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 11:26:45,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +23: [2023-04-29 11:26:45,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +23: [2023-04-29 11:26:45,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +23: [2023-04-29 11:26:45,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +23: [2023-04-29 11:26:45,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 3: [2023-04-29 11:26:45,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +54: [2023-04-29 11:26:45,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 11:26:45,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 11:26:45,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 11:26:45,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 11:26:45,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +30: [2023-04-29 11:26:45,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +30: [2023-04-29 11:26:45,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +30: [2023-04-29 11:26:45,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +54: [2023-04-29 11:26:45,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +39: [2023-04-29 11:26:45,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +39: [2023-04-29 11:26:45,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +60: [2023-04-29 11:26:45,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +60: [2023-04-29 11:26:45,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +60: [2023-04-29 11:26:45,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +60: [2023-04-29 11:26:45,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +60: [2023-04-29 11:26:45,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +60: [2023-04-29 11:26:45,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +60: [2023-04-29 11:26:45,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +14: [2023-04-29 11:26:45,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +60: [2023-04-29 11:26:45,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 8: [2023-04-29 11:26:45,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 8: [2023-04-29 11:26:45,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +11: [2023-04-29 11:26:45,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +11: [2023-04-29 11:26:45,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +11: [2023-04-29 11:26:45,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +39: [2023-04-29 11:26:45,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +11: [2023-04-29 11:26:45,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 11:26:45,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +26: [2023-04-29 11:26:45,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +54: [2023-04-29 11:26:45,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +39: [2023-04-29 11:26:45,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +33: [2023-04-29 11:26:45,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +33: [2023-04-29 11:26:45,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +54: [2023-04-29 11:26:45,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +54: [2023-04-29 11:26:45,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +28: [2023-04-29 11:26:45,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +28: [2023-04-29 11:26:45,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +39: [2023-04-29 11:26:45,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +49: [2023-04-29 11:26:45,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +54: [2023-04-29 11:26:45,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +60: [2023-04-29 11:26:45,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +60: [2023-04-29 11:26:45,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +39: [2023-04-29 11:26:45,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +60: [2023-04-29 11:26:45,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +54: [2023-04-29 11:26:45,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +60: [2023-04-29 11:26:45,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +54: [2023-04-29 11:26:45,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +33: [2023-04-29 11:26:45,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +33: [2023-04-29 11:26:45,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +60: [2023-04-29 11:26:45,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +11: [2023-04-29 11:26:45,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +54: [2023-04-29 11:26:45,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +54: [2023-04-29 11:26:45,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +21: [2023-04-29 11:26:45,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 11:26:45,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 11:26:45,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +49: [2023-04-29 11:26:45,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_00-model_states.pt. +28: [2023-04-29 11:26:45,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +14: [2023-04-29 11:26:45,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +60: [2023-04-29 11:26:45,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +11: [2023-04-29 11:26:45,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +60: [2023-04-29 11:26:45,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +26: [2023-04-29 11:26:45,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +11: [2023-04-29 11:26:45,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +11: [2023-04-29 11:26:45,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +26: [2023-04-29 11:26:45,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +26: [2023-04-29 11:26:45,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +60: [2023-04-29 11:26:45,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +14: [2023-04-29 11:26:45,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +48: [2023-04-29 11:26:45,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +48: [2023-04-29 11:26:45,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +62: [2023-04-29 11:26:45,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 11:26:45,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 11:26:45,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 11:26:45,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 11:26:45,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 11:26:45,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 11:26:45,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 11:26:45,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +28: [2023-04-29 11:26:45,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +48: [2023-04-29 11:26:45,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +48: [2023-04-29 11:26:45,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +49: [2023-04-29 11:26:45,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 11:26:45,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 11:26:45,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +62: [2023-04-29 11:26:45,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +62: [2023-04-29 11:26:45,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +62: [2023-04-29 11:26:45,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +62: [2023-04-29 11:26:45,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +62: [2023-04-29 11:26:45,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 2: [2023-04-29 11:26:45,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 2: [2023-04-29 11:26:45,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +14: [2023-04-29 11:26:45,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +49: [2023-04-29 11:26:45,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +43: [2023-04-29 11:26:45,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 11:26:45,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +36: [2023-04-29 11:26:45,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 11:26:45,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +51: [2023-04-29 11:26:45,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +23: [2023-04-29 11:26:45,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +23: [2023-04-29 11:26:45,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +30: [2023-04-29 11:26:45,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +30: [2023-04-29 11:26:45,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +23: [2023-04-29 11:26:45,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +23: [2023-04-29 11:26:45,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +51: [2023-04-29 11:26:45,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +51: [2023-04-29 11:26:45,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +21: [2023-04-29 11:26:45,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +26: [2023-04-29 11:26:45,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +30: [2023-04-29 11:26:45,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +43: [2023-04-29 11:26:45,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +51: [2023-04-29 11:26:45,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +26: [2023-04-29 11:26:45,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +36: [2023-04-29 11:26:45,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +36: [2023-04-29 11:26:45,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 11:26:45,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +20: [2023-04-29 11:26:45,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +16: [2023-04-29 11:26:45,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +26: [2023-04-29 11:26:45,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +36: [2023-04-29 11:26:45,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 11:26:45,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +24: [2023-04-29 11:26:45,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +21: [2023-04-29 11:26:45,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +21: [2023-04-29 11:26:45,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +43: [2023-04-29 11:26:45,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +49: [2023-04-29 11:26:45,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +48: [2023-04-29 11:26:45,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +49: [2023-04-29 11:26:45,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +16: [2023-04-29 11:26:45,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 9: [2023-04-29 11:26:45,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +20: [2023-04-29 11:26:45,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +48: [2023-04-29 11:26:45,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +48: [2023-04-29 11:26:45,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +31: [2023-04-29 11:26:45,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +24: [2023-04-29 11:26:45,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +19: [2023-04-29 11:26:45,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +48: [2023-04-29 11:26:45,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 11:26:45,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +31: [2023-04-29 11:26:45,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +31: [2023-04-29 11:26:45,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +31: [2023-04-29 11:26:45,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +19: [2023-04-29 11:26:45,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +38: [2023-04-29 11:26:45,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +38: [2023-04-29 11:26:45,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +38: [2023-04-29 11:26:45,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +38: [2023-04-29 11:26:45,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +36: [2023-04-29 11:26:45,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 1: [2023-04-29 11:26:45,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 1: [2023-04-29 11:26:45,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 1: [2023-04-29 11:26:45,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +20: [2023-04-29 11:26:45,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +43: [2023-04-29 11:26:45,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 2: [2023-04-29 11:26:45,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +20: [2023-04-29 11:26:45,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +58: [2023-04-29 11:26:45,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +58: [2023-04-29 11:26:45,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +58: [2023-04-29 11:26:45,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +58: [2023-04-29 11:26:45,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +51: [2023-04-29 11:26:45,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +16: [2023-04-29 11:26:45,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +54: [2023-04-29 11:26:45,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +16: [2023-04-29 11:26:45,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +19: [2023-04-29 11:26:45,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +24: [2023-04-29 11:26:45,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +24: [2023-04-29 11:26:45,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 11:26:45,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 2: [2023-04-29 11:26:45,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 2: [2023-04-29 11:26:45,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 2: [2023-04-29 11:26:45,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +43: [2023-04-29 11:26:45,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +24: [2023-04-29 11:26:45,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 0: [2023-04-29 11:26:45,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 0: [2023-04-29 11:26:45,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 0: [2023-04-29 11:26:45,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 9: [2023-04-29 11:26:45,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +19: [2023-04-29 11:26:45,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +51: [2023-04-29 11:26:45,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +51: [2023-04-29 11:26:45,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +39: [2023-04-29 11:26:45,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +16: [2023-04-29 11:26:45,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +16: [2023-04-29 11:26:45,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +51: [2023-04-29 11:26:45,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +36: [2023-04-29 11:26:45,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +26: [2023-04-29 11:26:45,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +16: [2023-04-29 11:26:45,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 9: [2023-04-29 11:26:45,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +24: [2023-04-29 11:26:45,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +36: [2023-04-29 11:26:45,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +43: [2023-04-29 11:26:45,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +24: [2023-04-29 11:26:45,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 9: [2023-04-29 11:26:45,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +60: [2023-04-29 11:26:45,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 2: [2023-04-29 11:26:45,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 2: [2023-04-29 11:26:45,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +36: [2023-04-29 11:26:45,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +24: [2023-04-29 11:26:45,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 2: [2023-04-29 11:26:45,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +26: [2023-04-29 11:26:45,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +31: [2023-04-29 11:26:45,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +39: [2023-04-29 11:26:45,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +20: [2023-04-29 11:26:45,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +11: [2023-04-29 11:26:45,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +16: [2023-04-29 11:26:45,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +26: [2023-04-29 11:26:45,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +54: [2023-04-29 11:26:45,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +26: [2023-04-29 11:26:45,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 4: [2023-04-29 11:26:45,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +60: [2023-04-29 11:26:45,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 7: [2023-04-29 11:26:45,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +39: [2023-04-29 11:26:45,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +26: [2023-04-29 11:26:45,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +19: [2023-04-29 11:26:45,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +19: [2023-04-29 11:26:45,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 7: [2023-04-29 11:26:45,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 7: [2023-04-29 11:26:45,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +20: [2023-04-29 11:26:45,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +54: [2023-04-29 11:26:45,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +31: [2023-04-29 11:26:45,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +39: [2023-04-29 11:26:45,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +26: [2023-04-29 11:26:45,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +31: [2023-04-29 11:26:45,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +54: [2023-04-29 11:26:45,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +54: [2023-04-29 11:26:45,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +58: [2023-04-29 11:26:45,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +58: [2023-04-29 11:26:45,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +31: [2023-04-29 11:26:45,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +38: [2023-04-29 11:26:45,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +62: [2023-04-29 11:26:45,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +11: [2023-04-29 11:26:45,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +11: [2023-04-29 11:26:45,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +11: [2023-04-29 11:26:45,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +38: [2023-04-29 11:26:45,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +20: [2023-04-29 11:26:45,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +38: [2023-04-29 11:26:45,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +47: [2023-04-29 11:26:45,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +47: [2023-04-29 11:26:45,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. + 4: [2023-04-29 11:26:45,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +58: [2023-04-29 11:26:45,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +58: [2023-04-29 11:26:45,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +47: [2023-04-29 11:26:45,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +47: [2023-04-29 11:26:45,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +38: [2023-04-29 11:26:45,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +19: [2023-04-29 11:26:45,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +62: [2023-04-29 11:26:45,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +60: [2023-04-29 11:26:45,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 11:26:45,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 11:26:45,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +19: [2023-04-29 11:26:45,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +60: [2023-04-29 11:26:45,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +11: [2023-04-29 11:26:45,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +60: [2023-04-29 11:26:45,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +23: [2023-04-29 11:26:45,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +23: [2023-04-29 11:26:45,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +23: [2023-04-29 11:26:45,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +39: [2023-04-29 11:26:45,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +60: [2023-04-29 11:26:45,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +39: [2023-04-29 11:26:45,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +54: [2023-04-29 11:26:45,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +10: [2023-04-29 11:26:45,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +10: [2023-04-29 11:26:45,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +10: [2023-04-29 11:26:45,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +10: [2023-04-29 11:26:45,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 2: [2023-04-29 11:26:45,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +23: [2023-04-29 11:26:45,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +23: [2023-04-29 11:26:45,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +23: [2023-04-29 11:26:45,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +23: [2023-04-29 11:26:45,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 7: [2023-04-29 11:26:45,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 7: [2023-04-29 11:26:45,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +10: [2023-04-29 11:26:45,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +10: [2023-04-29 11:26:45,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +39: [2023-04-29 11:26:45,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +55: [2023-04-29 11:26:45,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +55: [2023-04-29 11:26:45,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +55: [2023-04-29 11:26:45,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +10: [2023-04-29 11:26:45,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 7: [2023-04-29 11:26:45,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +55: [2023-04-29 11:26:45,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 11:26:45,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +23: [2023-04-29 11:26:45,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +10: [2023-04-29 11:26:45,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +47: [2023-04-29 11:26:45,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +54: [2023-04-29 11:26:45,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +47: [2023-04-29 11:26:45,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +47: [2023-04-29 11:26:45,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 7: [2023-04-29 11:26:45,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +47: [2023-04-29 11:26:45,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +11: [2023-04-29 11:26:45,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +39: [2023-04-29 11:26:45,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +55: [2023-04-29 11:26:45,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +62: [2023-04-29 11:26:45,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +55: [2023-04-29 11:26:45,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +55: [2023-04-29 11:26:45,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +62: [2023-04-29 11:26:45,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +55: [2023-04-29 11:26:45,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +11: [2023-04-29 11:26:45,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +11: [2023-04-29 11:26:45,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +41: [2023-04-29 11:26:45,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +41: [2023-04-29 11:26:45,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +41: [2023-04-29 11:26:45,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +41: [2023-04-29 11:26:45,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +60: [2023-04-29 11:26:45,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 8: [2023-04-29 11:26:45,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 8: [2023-04-29 11:26:45,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +62: [2023-04-29 11:26:45,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +62: [2023-04-29 11:26:45,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +60: [2023-04-29 11:26:45,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +29: [2023-04-29 11:26:45,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +29: [2023-04-29 11:26:45,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +29: [2023-04-29 11:26:45,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +29: [2023-04-29 11:26:45,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +27: [2023-04-29 11:26:45,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +27: [2023-04-29 11:26:45,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +27: [2023-04-29 11:26:45,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +27: [2023-04-29 11:26:45,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +30: [2023-04-29 11:26:45,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +30: [2023-04-29 11:26:45,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +30: [2023-04-29 11:26:45,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +30: [2023-04-29 11:26:45,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +41: [2023-04-29 11:26:45,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +41: [2023-04-29 11:26:45,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +41: [2023-04-29 11:26:45,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +41: [2023-04-29 11:26:45,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 1: [2023-04-29 11:26:45,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 1: [2023-04-29 11:26:45,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 6: [2023-04-29 11:26:45,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 6: [2023-04-29 11:26:45,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 6: [2023-04-29 11:26:45,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 6: [2023-04-29 11:26:45,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 1: [2023-04-29 11:26:45,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 1: [2023-04-29 11:26:45,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 1: [2023-04-29 11:26:45,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 1: [2023-04-29 11:26:45,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 6: [2023-04-29 11:26:45,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +35: [2023-04-29 11:26:45,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +35: [2023-04-29 11:26:45,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +35: [2023-04-29 11:26:45,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +35: [2023-04-29 11:26:45,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +29: [2023-04-29 11:26:45,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 11:26:45,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 11:26:45,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 11:26:45,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 11:26:45,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +30: [2023-04-29 11:26:45,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +29: [2023-04-29 11:26:45,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +10: [2023-04-29 11:26:45,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +17: [2023-04-29 11:26:45,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +17: [2023-04-29 11:26:45,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +17: [2023-04-29 11:26:45,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +17: [2023-04-29 11:26:45,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +30: [2023-04-29 11:26:45,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +27: [2023-04-29 11:26:45,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +10: [2023-04-29 11:26:45,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +55: [2023-04-29 11:26:45,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +18: [2023-04-29 11:26:45,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +18: [2023-04-29 11:26:45,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +27: [2023-04-29 11:26:45,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +18: [2023-04-29 11:26:45,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +18: [2023-04-29 11:26:45,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 11:26:45,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 11:26:45,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 11:26:45,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +55: [2023-04-29 11:26:45,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +18: [2023-04-29 11:26:45,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +55: [2023-04-29 11:26:45,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +27: [2023-04-29 11:26:45,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +27: [2023-04-29 11:26:45,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +63: [2023-04-29 11:26:45,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +63: [2023-04-29 11:26:45,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +63: [2023-04-29 11:26:45,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +63: [2023-04-29 11:26:45,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +18: [2023-04-29 11:26:45,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +18: [2023-04-29 11:26:45,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +63: [2023-04-29 11:26:45,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +18: [2023-04-29 11:26:45,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +10: [2023-04-29 11:26:45,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +63: [2023-04-29 11:26:45,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +18: [2023-04-29 11:26:45,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +63: [2023-04-29 11:26:45,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +63: [2023-04-29 11:26:45,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +10: [2023-04-29 11:26:45,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +35: [2023-04-29 11:26:45,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +35: [2023-04-29 11:26:45,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +35: [2023-04-29 11:26:45,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +35: [2023-04-29 11:26:45,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +10: [2023-04-29 11:26:45,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +55: [2023-04-29 11:26:45,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +17: [2023-04-29 11:26:45,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +17: [2023-04-29 11:26:45,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +17: [2023-04-29 11:26:45,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +17: [2023-04-29 11:26:45,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +10: [2023-04-29 11:26:45,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +55: [2023-04-29 11:26:45,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +55: [2023-04-29 11:26:45,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +42: [2023-04-29 11:26:45,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +42: [2023-04-29 11:26:45,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +42: [2023-04-29 11:26:45,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +42: [2023-04-29 11:26:45,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +46: [2023-04-29 11:26:45,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +46: [2023-04-29 11:26:45,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +46: [2023-04-29 11:26:45,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +46: [2023-04-29 11:26:45,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +55: [2023-04-29 11:26:45,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +18: [2023-04-29 11:26:45,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +44: [2023-04-29 11:26:45,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +44: [2023-04-29 11:26:45,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +44: [2023-04-29 11:26:45,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +44: [2023-04-29 11:26:45,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +61: [2023-04-29 11:26:45,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +61: [2023-04-29 11:26:45,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +61: [2023-04-29 11:26:45,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +61: [2023-04-29 11:26:45,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +61: [2023-04-29 11:26:45,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +61: [2023-04-29 11:26:45,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +61: [2023-04-29 11:26:45,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +18: [2023-04-29 11:26:45,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +18: [2023-04-29 11:26:45,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +61: [2023-04-29 11:26:45,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 11:26:45,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +10: [2023-04-29 11:26:45,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +61: [2023-04-29 11:26:45,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... + 0: [2023-04-29 11:26:45,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +61: [2023-04-29 11:26:45,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +61: [2023-04-29 11:26:45,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... + 0: [2023-04-29 11:26:45,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +61: [2023-04-29 11:26:45,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +61: [2023-04-29 11:26:45,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +61: [2023-04-29 11:26:45,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +10: [2023-04-29 11:26:45,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +61: [2023-04-29 11:26:45,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +61: [2023-04-29 11:26:45,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 0: [2023-04-29 11:26:45,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 0: [2023-04-29 11:26:45,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +37: [2023-04-29 11:26:45,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +37: [2023-04-29 11:26:45,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +37: [2023-04-29 11:26:45,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +37: [2023-04-29 11:26:45,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +32: [2023-04-29 11:26:45,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +32: [2023-04-29 11:26:45,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +32: [2023-04-29 11:26:45,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +32: [2023-04-29 11:26:45,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +32: [2023-04-29 11:26:45,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +32: [2023-04-29 11:26:45,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +32: [2023-04-29 11:26:45,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +32: [2023-04-29 11:26:45,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +55: [2023-04-29 11:26:45,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +32: [2023-04-29 11:26:45,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +42: [2023-04-29 11:26:45,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +42: [2023-04-29 11:26:45,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +30: [2023-04-29 11:26:45,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +46: [2023-04-29 11:26:45,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +46: [2023-04-29 11:26:45,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +42: [2023-04-29 11:26:45,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +46: [2023-04-29 11:26:45,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +42: [2023-04-29 11:26:45,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +46: [2023-04-29 11:26:45,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +32: [2023-04-29 11:26:45,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... + 6: [2023-04-29 11:26:45,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +44: [2023-04-29 11:26:45,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +29: [2023-04-29 11:26:45,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +19: [2023-04-29 11:26:45,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +19: [2023-04-29 11:26:45,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +27: [2023-04-29 11:26:45,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +27: [2023-04-29 11:26:45,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +30: [2023-04-29 11:26:45,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +32: [2023-04-29 11:26:45,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +19: [2023-04-29 11:26:45,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +32: [2023-04-29 11:26:45,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +32: [2023-04-29 11:26:45,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +32: [2023-04-29 11:26:45,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +14: [2023-04-29 11:26:45,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +14: [2023-04-29 11:26:45,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +14: [2023-04-29 11:26:45,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +14: [2023-04-29 11:26:45,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +32: [2023-04-29 11:26:45,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +32: [2023-04-29 11:26:45,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +44: [2023-04-29 11:26:45,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +30: [2023-04-29 11:26:45,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +44: [2023-04-29 11:26:45,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +19: [2023-04-29 11:26:45,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +29: [2023-04-29 11:26:45,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +44: [2023-04-29 11:26:45,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +29: [2023-04-29 11:26:45,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +27: [2023-04-29 11:26:45,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +29: [2023-04-29 11:26:45,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +27: [2023-04-29 11:26:45,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +29: [2023-04-29 11:26:45,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +27: [2023-04-29 11:26:45,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +27: [2023-04-29 11:26:45,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +63: [2023-04-29 11:26:45,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +30: [2023-04-29 11:26:45,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +53: [2023-04-29 11:26:45,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +53: [2023-04-29 11:26:45,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +63: [2023-04-29 11:26:45,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +53: [2023-04-29 11:26:45,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +53: [2023-04-29 11:26:45,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +53: [2023-04-29 11:26:45,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +53: [2023-04-29 11:26:45,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +53: [2023-04-29 11:26:45,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +53: [2023-04-29 11:26:45,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +30: [2023-04-29 11:26:45,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +30: [2023-04-29 11:26:45,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +45: [2023-04-29 11:26:45,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +45: [2023-04-29 11:26:45,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +45: [2023-04-29 11:26:45,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +45: [2023-04-29 11:26:45,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +27: [2023-04-29 11:26:45,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +27: [2023-04-29 11:26:45,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +22: [2023-04-29 11:26:45,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +22: [2023-04-29 11:26:45,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +22: [2023-04-29 11:26:45,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +29: [2023-04-29 11:26:45,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +29: [2023-04-29 11:26:45,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +22: [2023-04-29 11:26:45,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +31: [2023-04-29 11:26:45,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +31: [2023-04-29 11:26:45,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +31: [2023-04-29 11:26:45,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +31: [2023-04-29 11:26:45,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 4: [2023-04-29 11:26:45,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 4: [2023-04-29 11:26:45,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +30: [2023-04-29 11:26:45,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 4: [2023-04-29 11:26:45,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +53: [2023-04-29 11:26:45,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +53: [2023-04-29 11:26:45,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +53: [2023-04-29 11:26:45,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +13: [2023-04-29 11:26:45,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +53: [2023-04-29 11:26:45,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +13: [2023-04-29 11:26:45,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +13: [2023-04-29 11:26:45,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +13: [2023-04-29 11:26:45,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +37: [2023-04-29 11:26:45,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +45: [2023-04-29 11:26:45,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +53: [2023-04-29 11:26:45,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +29: [2023-04-29 11:26:45,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +45: [2023-04-29 11:26:45,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +53: [2023-04-29 11:26:45,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +45: [2023-04-29 11:26:45,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +18: [2023-04-29 11:26:45,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +30: [2023-04-29 11:26:45,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +53: [2023-04-29 11:26:45,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +53: [2023-04-29 11:26:45,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +17: [2023-04-29 11:26:45,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +45: [2023-04-29 11:26:45,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +37: [2023-04-29 11:26:45,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +37: [2023-04-29 11:26:45,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +37: [2023-04-29 11:26:45,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +63: [2023-04-29 11:26:45,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +63: [2023-04-29 11:26:45,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +18: [2023-04-29 11:26:45,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +50: [2023-04-29 11:26:45,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +50: [2023-04-29 11:26:45,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +17: [2023-04-29 11:26:45,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +50: [2023-04-29 11:26:45,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +50: [2023-04-29 11:26:45,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +17: [2023-04-29 11:26:45,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +34: [2023-04-29 11:26:45,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +34: [2023-04-29 11:26:45,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. + 6: [2023-04-29 11:26:45,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 7: [2023-04-29 11:26:45,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +34: [2023-04-29 11:26:45,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +34: [2023-04-29 11:26:45,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +14: [2023-04-29 11:26:45,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +17: [2023-04-29 11:26:45,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 6: [2023-04-29 11:26:45,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +14: [2023-04-29 11:26:45,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +17: [2023-04-29 11:26:45,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +14: [2023-04-29 11:26:45,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 7: [2023-04-29 11:26:45,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +18: [2023-04-29 11:26:45,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 7: [2023-04-29 11:26:45,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +19: [2023-04-29 11:26:45,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +19: [2023-04-29 11:26:45,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +19: [2023-04-29 11:26:45,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +45: [2023-04-29 11:26:45,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +45: [2023-04-29 11:26:45,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +45: [2023-04-29 11:26:45,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +45: [2023-04-29 11:26:45,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +17: [2023-04-29 11:26:45,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +63: [2023-04-29 11:26:45,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +17: [2023-04-29 11:26:45,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 7: [2023-04-29 11:26:45,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 7: [2023-04-29 11:26:45,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +19: [2023-04-29 11:26:45,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +14: [2023-04-29 11:26:45,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 7: [2023-04-29 11:26:45,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 7: [2023-04-29 11:26:45,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +63: [2023-04-29 11:26:45,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +22: [2023-04-29 11:26:45,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +22: [2023-04-29 11:26:45,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +39: [2023-04-29 11:26:45,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +39: [2023-04-29 11:26:45,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +39: [2023-04-29 11:26:45,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +39: [2023-04-29 11:26:45,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. + 7: [2023-04-29 11:26:45,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +55: [2023-04-29 11:26:45,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +55: [2023-04-29 11:26:45,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +17: [2023-04-29 11:26:45,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +18: [2023-04-29 11:26:45,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +40: [2023-04-29 11:26:45,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +40: [2023-04-29 11:26:45,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +40: [2023-04-29 11:26:45,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +18: [2023-04-29 11:26:45,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +36: [2023-04-29 11:26:45,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +36: [2023-04-29 11:26:45,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +57: [2023-04-29 11:26:45,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +57: [2023-04-29 11:26:45,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +40: [2023-04-29 11:26:45,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +57: [2023-04-29 11:26:45,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +59: [2023-04-29 11:26:45,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +59: [2023-04-29 11:26:45,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +31: [2023-04-29 11:26:45,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +31: [2023-04-29 11:26:45,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +57: [2023-04-29 11:26:45,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +55: [2023-04-29 11:26:45,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +55: [2023-04-29 11:26:45,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. + 0: [2023-04-29 11:26:45,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +22: [2023-04-29 11:26:45,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +22: [2023-04-29 11:26:45,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +31: [2023-04-29 11:26:45,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +36: [2023-04-29 11:26:45,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +59: [2023-04-29 11:26:45,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +31: [2023-04-29 11:26:45,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +36: [2023-04-29 11:26:45,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +59: [2023-04-29 11:26:45,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +61: [2023-04-29 11:26:45,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +61: [2023-04-29 11:26:45,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +33: [2023-04-29 11:26:45,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +13: [2023-04-29 11:26:45,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +13: [2023-04-29 11:26:45,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +33: [2023-04-29 11:26:45,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +33: [2023-04-29 11:26:45,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +33: [2023-04-29 11:26:45,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +33: [2023-04-29 11:26:45,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +33: [2023-04-29 11:26:45,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +33: [2023-04-29 11:26:45,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +13: [2023-04-29 11:26:45,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +33: [2023-04-29 11:26:45,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +13: [2023-04-29 11:26:45,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +34: [2023-04-29 11:26:45,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +18: [2023-04-29 11:26:45,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +61: [2023-04-29 11:26:45,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +61: [2023-04-29 11:26:45,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +18: [2023-04-29 11:26:45,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +33: [2023-04-29 11:26:45,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +63: [2023-04-29 11:26:45,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +34: [2023-04-29 11:26:45,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +33: [2023-04-29 11:26:45,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +50: [2023-04-29 11:26:45,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +33: [2023-04-29 11:26:45,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +33: [2023-04-29 11:26:45,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +33: [2023-04-29 11:26:45,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +33: [2023-04-29 11:26:45,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +63: [2023-04-29 11:26:45,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +50: [2023-04-29 11:26:45,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +33: [2023-04-29 11:26:45,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +50: [2023-04-29 11:26:45,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +18: [2023-04-29 11:26:45,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 11:26:45,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +33: [2023-04-29 11:26:45,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +34: [2023-04-29 11:26:45,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +50: [2023-04-29 11:26:45,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +34: [2023-04-29 11:26:45,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +18: [2023-04-29 11:26:45,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +18: [2023-04-29 11:26:45,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +25: [2023-04-29 11:26:45,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +25: [2023-04-29 11:26:45,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +25: [2023-04-29 11:26:45,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +25: [2023-04-29 11:26:45,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +23: [2023-04-29 11:26:45,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +23: [2023-04-29 11:26:45,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +23: [2023-04-29 11:26:45,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +23: [2023-04-29 11:26:45,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 11:26:45,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +12: [2023-04-29 11:26:45,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +12: [2023-04-29 11:26:45,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +12: [2023-04-29 11:26:45,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 11:26:45,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +12: [2023-04-29 11:26:45,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 11:26:45,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +27: [2023-04-29 11:26:45,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +27: [2023-04-29 11:26:45,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +27: [2023-04-29 11:26:45,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +27: [2023-04-29 11:26:45,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 11:26:45,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 11:26:45,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 11:26:45,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 11:26:45,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +45: [2023-04-29 11:26:45,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +59: [2023-04-29 11:26:45,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +59: [2023-04-29 11:26:45,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +12: [2023-04-29 11:26:45,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +12: [2023-04-29 11:26:45,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 1: [2023-04-29 11:26:45,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 1: [2023-04-29 11:26:45,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +12: [2023-04-29 11:26:45,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +12: [2023-04-29 11:26:45,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +39: [2023-04-29 11:26:45,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +39: [2023-04-29 11:26:45,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +45: [2023-04-29 11:26:45,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +36: [2023-04-29 11:26:45,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +36: [2023-04-29 11:26:45,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +16: [2023-04-29 11:26:45,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +16: [2023-04-29 11:26:45,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +16: [2023-04-29 11:26:45,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +17: [2023-04-29 11:26:45,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +17: [2023-04-29 11:26:45,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +17: [2023-04-29 11:26:45,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +16: [2023-04-29 11:26:45,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +17: [2023-04-29 11:26:45,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +40: [2023-04-29 11:26:45,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +53: [2023-04-29 11:26:45,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +23: [2023-04-29 11:26:45,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +10: [2023-04-29 11:26:45,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +10: [2023-04-29 11:26:45,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +10: [2023-04-29 11:26:45,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +10: [2023-04-29 11:26:45,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +39: [2023-04-29 11:26:45,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +39: [2023-04-29 11:26:45,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +23: [2023-04-29 11:26:45,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +13: [2023-04-29 11:26:45,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +13: [2023-04-29 11:26:45,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +13: [2023-04-29 11:26:45,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +23: [2023-04-29 11:26:45,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +36: [2023-04-29 11:26:45,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +12: [2023-04-29 11:26:45,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +57: [2023-04-29 11:26:45,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +55: [2023-04-29 11:26:45,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +57: [2023-04-29 11:26:45,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +13: [2023-04-29 11:26:45,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +12: [2023-04-29 11:26:45,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +15: [2023-04-29 11:26:45,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +15: [2023-04-29 11:26:45,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +24: [2023-04-29 11:26:45,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +24: [2023-04-29 11:26:45,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +12: [2023-04-29 11:26:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +45: [2023-04-29 11:26:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +45: [2023-04-29 11:26:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +55: [2023-04-29 11:26:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +24: [2023-04-29 11:26:45,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 11:26:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +12: [2023-04-29 11:26:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +24: [2023-04-29 11:26:45,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +55: [2023-04-29 11:26:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +27: [2023-04-29 11:26:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +15: [2023-04-29 11:26:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +23: [2023-04-29 11:26:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +40: [2023-04-29 11:26:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +40: [2023-04-29 11:26:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +27: [2023-04-29 11:26:45,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +18: [2023-04-29 11:26:45,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +15: [2023-04-29 11:26:45,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +36: [2023-04-29 11:26:45,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +59: [2023-04-29 11:26:45,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +15: [2023-04-29 11:26:45,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +29: [2023-04-29 11:26:45,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 11:26:45,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 1: [2023-04-29 11:26:45,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +29: [2023-04-29 11:26:45,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +29: [2023-04-29 11:26:45,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 11:26:45,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +21: [2023-04-29 11:26:45,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +21: [2023-04-29 11:26:45,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +15: [2023-04-29 11:26:45,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +16: [2023-04-29 11:26:45,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +21: [2023-04-29 11:26:45,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +17: [2023-04-29 11:26:45,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 11:26:45,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +27: [2023-04-29 11:26:45,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +16: [2023-04-29 11:26:45,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +27: [2023-04-29 11:26:45,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +29: [2023-04-29 11:26:45,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 11:26:45,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 11:26:45,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +16: [2023-04-29 11:26:45,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +61: [2023-04-29 11:26:45,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +57: [2023-04-29 11:26:45,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +57: [2023-04-29 11:26:45,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +16: [2023-04-29 11:26:45,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +40: [2023-04-29 11:26:45,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +61: [2023-04-29 11:26:45,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +59: [2023-04-29 11:26:45,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +24: [2023-04-29 11:26:45,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +24: [2023-04-29 11:26:45,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +55: [2023-04-29 11:26:45,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +17: [2023-04-29 11:26:45,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +13: [2023-04-29 11:26:45,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +13: [2023-04-29 11:26:45,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +13: [2023-04-29 11:26:45,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +13: [2023-04-29 11:26:45,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +32: [2023-04-29 11:26:45,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +32: [2023-04-29 11:26:45,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +32: [2023-04-29 11:26:45,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +32: [2023-04-29 11:26:45,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +29: [2023-04-29 11:26:45,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +24: [2023-04-29 11:26:45,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +24: [2023-04-29 11:26:45,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +29: [2023-04-29 11:26:45,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +61: [2023-04-29 11:26:45,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +29: [2023-04-29 11:26:45,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +29: [2023-04-29 11:26:45,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +61: [2023-04-29 11:26:45,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +53: [2023-04-29 11:26:45,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +24: [2023-04-29 11:26:45,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +24: [2023-04-29 11:26:45,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +24: [2023-04-29 11:26:45,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +24: [2023-04-29 11:26:45,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 0: [2023-04-29 11:26:45,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +53: [2023-04-29 11:26:45,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +53: [2023-04-29 11:26:45,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +25: [2023-04-29 11:26:45,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +45: [2023-04-29 11:26:45,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +14: [2023-04-29 11:26:45,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +12: [2023-04-29 11:26:45,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +40: [2023-04-29 11:26:45,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +40: [2023-04-29 11:26:45,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +40: [2023-04-29 11:26:45,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +40: [2023-04-29 11:26:45,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +25: [2023-04-29 11:26:45,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +25: [2023-04-29 11:26:45,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +25: [2023-04-29 11:26:45,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +37: [2023-04-29 11:26:45,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +37: [2023-04-29 11:26:45,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +37: [2023-04-29 11:26:45,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +37: [2023-04-29 11:26:45,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +37: [2023-04-29 11:26:45,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +37: [2023-04-29 11:26:45,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +45: [2023-04-29 11:26:45,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +45: [2023-04-29 11:26:45,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +10: [2023-04-29 11:26:45,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +53: [2023-04-29 11:26:45,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +40: [2023-04-29 11:26:45,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +37: [2023-04-29 11:26:45,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +14: [2023-04-29 11:26:45,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +12: [2023-04-29 11:26:45,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +12: [2023-04-29 11:26:45,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +12: [2023-04-29 11:26:45,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +25: [2023-04-29 11:26:45,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +25: [2023-04-29 11:26:45,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +25: [2023-04-29 11:26:45,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +25: [2023-04-29 11:26:45,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +37: [2023-04-29 11:26:45,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +37: [2023-04-29 11:26:45,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +40: [2023-04-29 11:26:45,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +40: [2023-04-29 11:26:45,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +11: [2023-04-29 11:26:45,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +11: [2023-04-29 11:26:45,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +11: [2023-04-29 11:26:45,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +37: [2023-04-29 11:26:45,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +11: [2023-04-29 11:26:45,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +37: [2023-04-29 11:26:45,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +34: [2023-04-29 11:26:45,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +34: [2023-04-29 11:26:45,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +34: [2023-04-29 11:26:45,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +34: [2023-04-29 11:26:45,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +14: [2023-04-29 11:26:45,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +37: [2023-04-29 11:26:45,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +21: [2023-04-29 11:26:45,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +10: [2023-04-29 11:26:45,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +40: [2023-04-29 11:26:45,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +37: [2023-04-29 11:26:45,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +37: [2023-04-29 11:26:45,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +14: [2023-04-29 11:26:45,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +10: [2023-04-29 11:26:45,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +19: [2023-04-29 11:26:45,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 11:26:45,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +21: [2023-04-29 11:26:45,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +25: [2023-04-29 11:26:45,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +22: [2023-04-29 11:26:45,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +34: [2023-04-29 11:26:45,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +14: [2023-04-29 11:26:45,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 8: [2023-04-29 11:26:45,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +25: [2023-04-29 11:26:45,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +25: [2023-04-29 11:26:45,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +10: [2023-04-29 11:26:45,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +19: [2023-04-29 11:26:45,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +25: [2023-04-29 11:26:45,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +21: [2023-04-29 11:26:45,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +15: [2023-04-29 11:26:45,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +26: [2023-04-29 11:26:45,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +26: [2023-04-29 11:26:45,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 7: [2023-04-29 11:26:45,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +26: [2023-04-29 11:26:45,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +37: [2023-04-29 11:26:45,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +26: [2023-04-29 11:26:45,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +19: [2023-04-29 11:26:45,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +34: [2023-04-29 11:26:45,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +21: [2023-04-29 11:26:45,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +14: [2023-04-29 11:26:45,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +34: [2023-04-29 11:26:45,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +22: [2023-04-29 11:26:45,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +31: [2023-04-29 11:26:45,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +19: [2023-04-29 11:26:45,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +19: [2023-04-29 11:26:45,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +14: [2023-04-29 11:26:45,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +15: [2023-04-29 11:26:45,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +37: [2023-04-29 11:26:45,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +15: [2023-04-29 11:26:45,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +34: [2023-04-29 11:26:45,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +22: [2023-04-29 11:26:45,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 7: [2023-04-29 11:26:45,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +19: [2023-04-29 11:26:45,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +53: [2023-04-29 11:26:45,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +33: [2023-04-29 11:26:45,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +32: [2023-04-29 11:26:45,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +22: [2023-04-29 11:26:45,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +32: [2023-04-29 11:26:45,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +24: [2023-04-29 11:26:45,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +19: [2023-04-29 11:26:45,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +19: [2023-04-29 11:26:45,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +32: [2023-04-29 11:26:45,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +32: [2023-04-29 11:26:45,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +16: [2023-04-29 11:26:45,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +16: [2023-04-29 11:26:45,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +21: [2023-04-29 11:26:45,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +21: [2023-04-29 11:26:45,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +21: [2023-04-29 11:26:45,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +21: [2023-04-29 11:26:45,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +53: [2023-04-29 11:26:45,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +33: [2023-04-29 11:26:45,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +45: [2023-04-29 11:26:45,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +53: [2023-04-29 11:26:45,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +14: [2023-04-29 11:26:45,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +31: [2023-04-29 11:26:45,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +31: [2023-04-29 11:26:45,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +31: [2023-04-29 11:26:45,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +34: [2023-04-29 11:26:45,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +33: [2023-04-29 11:26:45,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +48: [2023-04-29 11:26:45,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +48: [2023-04-29 11:26:45,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +16: [2023-04-29 11:26:45,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +13: [2023-04-29 11:26:45,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 5: [2023-04-29 11:26:45,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 5: [2023-04-29 11:26:45,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +48: [2023-04-29 11:26:45,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 5: [2023-04-29 11:26:45,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +48: [2023-04-29 11:26:45,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +48: [2023-04-29 11:26:45,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +48: [2023-04-29 11:26:45,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +48: [2023-04-29 11:26:45,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +16: [2023-04-29 11:26:45,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +48: [2023-04-29 11:26:45,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +30: [2023-04-29 11:26:45,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +30: [2023-04-29 11:26:45,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +30: [2023-04-29 11:26:45,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +31: [2023-04-29 11:26:45,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +21: [2023-04-29 11:26:45,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +30: [2023-04-29 11:26:45,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +21: [2023-04-29 11:26:45,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 5: [2023-04-29 11:26:45,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 11:26:45,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +21: [2023-04-29 11:26:45,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +24: [2023-04-29 11:26:45,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +45: [2023-04-29 11:26:45,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +45: [2023-04-29 11:26:45,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +34: [2023-04-29 11:26:45,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +22: [2023-04-29 11:26:45,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +22: [2023-04-29 11:26:45,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +34: [2023-04-29 11:26:45,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +24: [2023-04-29 11:26:45,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +24: [2023-04-29 11:26:45,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +31: [2023-04-29 11:26:45,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +48: [2023-04-29 11:26:45,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +31: [2023-04-29 11:26:45,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +31: [2023-04-29 11:26:45,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 5: [2023-04-29 11:26:45,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 5: [2023-04-29 11:26:45,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +36: [2023-04-29 11:26:45,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +13: [2023-04-29 11:26:45,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +48: [2023-04-29 11:26:45,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +45: [2023-04-29 11:26:45,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +48: [2023-04-29 11:26:45,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +30: [2023-04-29 11:26:45,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +13: [2023-04-29 11:26:45,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 5: [2023-04-29 11:26:45,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +30: [2023-04-29 11:26:45,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +30: [2023-04-29 11:26:45,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +48: [2023-04-29 11:26:45,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +48: [2023-04-29 11:26:45,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +48: [2023-04-29 11:26:45,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +55: [2023-04-29 11:26:45,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +30: [2023-04-29 11:26:45,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +48: [2023-04-29 11:26:45,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +34: [2023-04-29 11:26:45,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +48: [2023-04-29 11:26:45,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... + 4: [2023-04-29 11:26:45,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 5: [2023-04-29 11:26:45,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +33: [2023-04-29 11:26:45,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +36: [2023-04-29 11:26:45,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +11: [2023-04-29 11:26:45,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +27: [2023-04-29 11:26:45,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +22: [2023-04-29 11:26:45,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +13: [2023-04-29 11:26:45,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +22: [2023-04-29 11:26:45,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +55: [2023-04-29 11:26:45,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... + 2: [2023-04-29 11:26:45,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 2: [2023-04-29 11:26:45,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 2: [2023-04-29 11:26:45,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 2: [2023-04-29 11:26:45,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +13: [2023-04-29 11:26:45,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +26: [2023-04-29 11:26:45,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +39: [2023-04-29 11:26:45,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +23: [2023-04-29 11:26:45,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +36: [2023-04-29 11:26:45,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +11: [2023-04-29 11:26:45,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +13: [2023-04-29 11:26:45,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +16: [2023-04-29 11:26:45,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +39: [2023-04-29 11:26:45,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +13: [2023-04-29 11:26:45,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +36: [2023-04-29 11:26:45,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +16: [2023-04-29 11:26:45,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 6: [2023-04-29 11:26:45,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 6: [2023-04-29 11:26:45,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 6: [2023-04-29 11:26:45,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 6: [2023-04-29 11:26:45,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +11: [2023-04-29 11:26:45,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +55: [2023-04-29 11:26:45,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 1: [2023-04-29 11:26:45,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 7: [2023-04-29 11:26:45,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +40: [2023-04-29 11:26:45,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +11: [2023-04-29 11:26:45,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +17: [2023-04-29 11:26:45,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 3: [2023-04-29 11:26:45,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 3: [2023-04-29 11:26:45,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. + 3: [2023-04-29 11:26:45,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +26: [2023-04-29 11:26:45,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 3: [2023-04-29 11:26:45,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +36: [2023-04-29 11:26:45,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +36: [2023-04-29 11:26:45,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +39: [2023-04-29 11:26:45,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +26: [2023-04-29 11:26:45,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +23: [2023-04-29 11:26:45,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +23: [2023-04-29 11:26:45,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +39: [2023-04-29 11:26:45,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +34: [2023-04-29 11:26:45,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +16: [2023-04-29 11:26:45,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +36: [2023-04-29 11:26:45,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +13: [2023-04-29 11:26:45,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +23: [2023-04-29 11:26:45,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +55: [2023-04-29 11:26:45,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +33: [2023-04-29 11:26:45,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +45: [2023-04-29 11:26:45,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +26: [2023-04-29 11:26:45,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +39: [2023-04-29 11:26:45,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +33: [2023-04-29 11:26:45,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +17: [2023-04-29 11:26:45,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +17: [2023-04-29 11:26:45,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +39: [2023-04-29 11:26:45,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +27: [2023-04-29 11:26:45,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +27: [2023-04-29 11:26:45,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +27: [2023-04-29 11:26:45,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +36: [2023-04-29 11:26:45,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +16: [2023-04-29 11:26:45,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 11:26:45,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +16: [2023-04-29 11:26:45,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 1: [2023-04-29 11:26:45,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +34: [2023-04-29 11:26:45,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +40: [2023-04-29 11:26:45,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +40: [2023-04-29 11:26:45,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +12: [2023-04-29 11:26:45,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +40: [2023-04-29 11:26:45,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +29: [2023-04-29 11:26:45,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 11:26:45,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 11:26:45,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +45: [2023-04-29 11:26:45,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +11: [2023-04-29 11:26:45,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +29: [2023-04-29 11:26:45,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +24: [2023-04-29 11:26:45,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +16: [2023-04-29 11:26:45,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +45: [2023-04-29 11:26:45,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +24: [2023-04-29 11:26:45,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +12: [2023-04-29 11:26:45,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +45: [2023-04-29 11:26:45,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +39: [2023-04-29 11:26:45,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +55: [2023-04-29 11:26:45,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +39: [2023-04-29 11:26:45,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +28: [2023-04-29 11:26:45,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +28: [2023-04-29 11:26:45,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +28: [2023-04-29 11:26:45,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +28: [2023-04-29 11:26:45,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +40: [2023-04-29 11:26:45,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +50: [2023-04-29 11:26:45,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +50: [2023-04-29 11:26:45,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +50: [2023-04-29 11:26:45,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +50: [2023-04-29 11:26:45,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +50: [2023-04-29 11:26:45,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +33: [2023-04-29 11:26:45,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +50: [2023-04-29 11:26:45,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +50: [2023-04-29 11:26:45,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +50: [2023-04-29 11:26:45,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +34: [2023-04-29 11:26:45,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +13: [2023-04-29 11:26:45,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +29: [2023-04-29 11:26:45,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +29: [2023-04-29 11:26:45,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +11: [2023-04-29 11:26:45,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +40: [2023-04-29 11:26:45,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +45: [2023-04-29 11:26:45,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +16: [2023-04-29 11:26:45,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +40: [2023-04-29 11:26:45,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +59: [2023-04-29 11:26:45,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +59: [2023-04-29 11:26:45,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +59: [2023-04-29 11:26:45,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +59: [2023-04-29 11:26:45,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +59: [2023-04-29 11:26:45,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +59: [2023-04-29 11:26:45,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +59: [2023-04-29 11:26:45,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +59: [2023-04-29 11:26:45,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +37: [2023-04-29 11:26:45,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +12: [2023-04-29 11:26:45,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +11: [2023-04-29 11:26:45,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +11: [2023-04-29 11:26:45,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +11: [2023-04-29 11:26:45,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +13: [2023-04-29 11:26:45,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +55: [2023-04-29 11:26:45,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +25: [2023-04-29 11:26:45,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +50: [2023-04-29 11:26:45,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +50: [2023-04-29 11:26:45,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +50: [2023-04-29 11:26:45,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +50: [2023-04-29 11:26:45,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +50: [2023-04-29 11:26:45,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +40: [2023-04-29 11:26:45,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +34: [2023-04-29 11:26:45,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +13: [2023-04-29 11:26:45,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +13: [2023-04-29 11:26:45,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +40: [2023-04-29 11:26:45,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +55: [2023-04-29 11:26:45,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +59: [2023-04-29 11:26:45,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +59: [2023-04-29 11:26:45,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +45: [2023-04-29 11:26:45,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +45: [2023-04-29 11:26:45,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +27: [2023-04-29 11:26:45,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +59: [2023-04-29 11:26:45,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... + 9: [2023-04-29 11:26:45,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +50: [2023-04-29 11:26:45,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +50: [2023-04-29 11:26:45,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +50: [2023-04-29 11:26:45,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +12: [2023-04-29 11:26:45,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +33: [2023-04-29 11:26:45,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +12: [2023-04-29 11:26:45,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +12: [2023-04-29 11:26:45,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +34: [2023-04-29 11:26:45,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +16: [2023-04-29 11:26:45,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 2: [2023-04-29 11:26:45,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +25: [2023-04-29 11:26:45,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +11: [2023-04-29 11:26:45,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +10: [2023-04-29 11:26:45,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 2: [2023-04-29 11:26:45,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +55: [2023-04-29 11:26:45,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +11: [2023-04-29 11:26:45,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +25: [2023-04-29 11:26:45,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +11: [2023-04-29 11:26:45,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +25: [2023-04-29 11:26:45,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +23: [2023-04-29 11:26:45,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +59: [2023-04-29 11:26:45,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +59: [2023-04-29 11:26:45,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +59: [2023-04-29 11:26:45,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +49: [2023-04-29 11:26:45,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +49: [2023-04-29 11:26:45,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. + 3: [2023-04-29 11:26:45,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +59: [2023-04-29 11:26:45,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +16: [2023-04-29 11:26:45,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +59: [2023-04-29 11:26:45,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +45: [2023-04-29 11:26:45,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +16: [2023-04-29 11:26:45,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 8: [2023-04-29 11:26:45,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 8: [2023-04-29 11:26:45,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +49: [2023-04-29 11:26:45,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +25: [2023-04-29 11:26:45,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 6: [2023-04-29 11:26:45,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +49: [2023-04-29 11:26:45,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. + 6: [2023-04-29 11:26:45,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +45: [2023-04-29 11:26:45,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... + 8: [2023-04-29 11:26:45,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 2: [2023-04-29 11:26:45,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 11:26:45,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +10: [2023-04-29 11:26:45,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +21: [2023-04-29 11:26:45,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 11:26:45,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +25: [2023-04-29 11:26:45,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +25: [2023-04-29 11:26:45,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 3: [2023-04-29 11:26:45,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +40: [2023-04-29 11:26:45,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +40: [2023-04-29 11:26:45,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +15: [2023-04-29 11:26:45,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 11:26:45,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +17: [2023-04-29 11:26:45,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +29: [2023-04-29 11:26:45,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +37: [2023-04-29 11:26:45,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +37: [2023-04-29 11:26:45,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 3: [2023-04-29 11:26:45,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 3: [2023-04-29 11:26:45,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +44: [2023-04-29 11:26:45,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +44: [2023-04-29 11:26:45,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +44: [2023-04-29 11:26:45,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +44: [2023-04-29 11:26:45,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +44: [2023-04-29 11:26:45,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +44: [2023-04-29 11:26:45,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +44: [2023-04-29 11:26:45,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +44: [2023-04-29 11:26:45,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +24: [2023-04-29 11:26:45,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 3: [2023-04-29 11:26:45,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 11:26:45,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +40: [2023-04-29 11:26:45,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +21: [2023-04-29 11:26:45,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 4: [2023-04-29 11:26:45,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +25: [2023-04-29 11:26:45,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +25: [2023-04-29 11:26:45,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +37: [2023-04-29 11:26:45,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +23: [2023-04-29 11:26:45,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +24: [2023-04-29 11:26:45,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 3: [2023-04-29 11:26:45,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 3: [2023-04-29 11:26:45,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 3: [2023-04-29 11:26:45,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +23: [2023-04-29 11:26:45,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +12: [2023-04-29 11:26:45,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +29: [2023-04-29 11:26:45,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +17: [2023-04-29 11:26:45,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +24: [2023-04-29 11:26:45,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +24: [2023-04-29 11:26:45,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 11:26:45,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +21: [2023-04-29 11:26:45,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +25: [2023-04-29 11:26:45,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +12: [2023-04-29 11:26:45,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 11:26:45,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +15: [2023-04-29 11:26:45,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +34: [2023-04-29 11:26:45,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +44: [2023-04-29 11:26:45,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +23: [2023-04-29 11:26:45,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +28: [2023-04-29 11:26:45,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +17: [2023-04-29 11:26:45,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 3: [2023-04-29 11:26:45,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +44: [2023-04-29 11:26:45,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +12: [2023-04-29 11:26:45,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +23: [2023-04-29 11:26:45,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +23: [2023-04-29 11:26:45,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +23: [2023-04-29 11:26:45,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +21: [2023-04-29 11:26:45,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +23: [2023-04-29 11:26:45,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +34: [2023-04-29 11:26:45,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +44: [2023-04-29 11:26:45,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +27: [2023-04-29 11:26:45,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 3: [2023-04-29 11:26:45,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 1: [2023-04-29 11:26:45,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +21: [2023-04-29 11:26:45,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 1: [2023-04-29 11:26:45,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +10: [2023-04-29 11:26:45,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +10: [2023-04-29 11:26:45,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +10: [2023-04-29 11:26:45,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +28: [2023-04-29 11:26:45,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +27: [2023-04-29 11:26:45,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +44: [2023-04-29 11:26:45,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +44: [2023-04-29 11:26:45,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +27: [2023-04-29 11:26:45,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +44: [2023-04-29 11:26:45,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +15: [2023-04-29 11:26:45,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +37: [2023-04-29 11:26:45,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 3: [2023-04-29 11:26:45,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +12: [2023-04-29 11:26:45,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +28: [2023-04-29 11:26:45,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +28: [2023-04-29 11:26:45,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +12: [2023-04-29 11:26:45,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 1: [2023-04-29 11:26:45,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +44: [2023-04-29 11:26:45,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +28: [2023-04-29 11:26:45,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +28: [2023-04-29 11:26:45,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +44: [2023-04-29 11:26:45,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +40: [2023-04-29 11:26:45,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +28: [2023-04-29 11:26:45,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +24: [2023-04-29 11:26:45,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +28: [2023-04-29 11:26:45,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 1: [2023-04-29 11:26:45,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +21: [2023-04-29 11:26:45,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +21: [2023-04-29 11:26:45,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +29: [2023-04-29 11:26:45,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +29: [2023-04-29 11:26:45,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +21: [2023-04-29 11:26:45,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +25: [2023-04-29 11:26:45,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +13: [2023-04-29 11:26:45,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +25: [2023-04-29 11:26:45,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +12: [2023-04-29 11:26:45,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 3: [2023-04-29 11:26:45,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +28: [2023-04-29 11:26:45,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +28: [2023-04-29 11:26:45,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +12: [2023-04-29 11:26:45,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +24: [2023-04-29 11:26:45,700] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +19: [2023-04-29 11:26:45,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +19: [2023-04-29 11:26:45,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +15: [2023-04-29 11:26:45,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +13: [2023-04-29 11:26:45,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +34: [2023-04-29 11:26:45,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +10: [2023-04-29 11:26:45,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +10: [2023-04-29 11:26:45,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +10: [2023-04-29 11:26:45,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +49: [2023-04-29 11:26:45,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +22: [2023-04-29 11:26:45,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +22: [2023-04-29 11:26:45,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +48: [2023-04-29 11:26:45,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +48: [2023-04-29 11:26:45,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +28: [2023-04-29 11:26:45,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 2: [2023-04-29 11:26:45,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +30: [2023-04-29 11:26:45,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +28: [2023-04-29 11:26:45,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +12: [2023-04-29 11:26:45,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +12: [2023-04-29 11:26:45,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +25: [2023-04-29 11:26:45,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +16: [2023-04-29 11:26:45,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +22: [2023-04-29 11:26:45,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +22: [2023-04-29 11:26:45,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +19: [2023-04-29 11:26:45,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +49: [2023-04-29 11:26:45,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +19: [2023-04-29 11:26:45,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 2: [2023-04-29 11:26:45,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +49: [2023-04-29 11:26:45,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +63: [2023-04-29 11:26:45,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +63: [2023-04-29 11:26:45,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +13: [2023-04-29 11:26:45,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +13: [2023-04-29 11:26:45,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 5: [2023-04-29 11:26:45,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 5: [2023-04-29 11:26:45,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +12: [2023-04-29 11:26:45,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +19: [2023-04-29 11:26:45,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +49: [2023-04-29 11:26:45,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +19: [2023-04-29 11:26:45,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +21: [2023-04-29 11:26:45,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +21: [2023-04-29 11:26:45,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +22: [2023-04-29 11:26:45,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +63: [2023-04-29 11:26:45,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +63: [2023-04-29 11:26:45,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. + 9: [2023-04-29 11:26:45,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +19: [2023-04-29 11:26:45,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +19: [2023-04-29 11:26:45,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +22: [2023-04-29 11:26:45,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +22: [2023-04-29 11:26:45,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +11: [2023-04-29 11:26:45,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 5: [2023-04-29 11:26:45,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 5: [2023-04-29 11:26:45,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +25: [2023-04-29 11:26:45,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +40: [2023-04-29 11:26:45,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +48: [2023-04-29 11:26:45,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +48: [2023-04-29 11:26:45,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +30: [2023-04-29 11:26:45,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +34: [2023-04-29 11:26:45,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +22: [2023-04-29 11:26:45,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +15: [2023-04-29 11:26:45,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 11:26:45,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 2: [2023-04-29 11:26:45,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +37: [2023-04-29 11:26:45,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +15: [2023-04-29 11:26:45,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 11:26:45,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +40: [2023-04-29 11:26:45,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +15: [2023-04-29 11:26:45,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +11: [2023-04-29 11:26:45,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +37: [2023-04-29 11:26:45,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +30: [2023-04-29 11:26:45,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +37: [2023-04-29 11:26:45,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +40: [2023-04-29 11:26:45,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +30: [2023-04-29 11:26:45,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +23: [2023-04-29 11:26:45,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +21: [2023-04-29 11:26:45,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +23: [2023-04-29 11:26:45,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +14: [2023-04-29 11:26:45,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +14: [2023-04-29 11:26:45,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +14: [2023-04-29 11:26:45,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +58: [2023-04-29 11:26:45,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +58: [2023-04-29 11:26:45,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +58: [2023-04-29 11:26:45,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +58: [2023-04-29 11:26:45,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +58: [2023-04-29 11:26:45,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +58: [2023-04-29 11:26:45,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +58: [2023-04-29 11:26:45,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +26: [2023-04-29 11:26:45,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +26: [2023-04-29 11:26:45,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 1: [2023-04-29 11:26:45,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +58: [2023-04-29 11:26:45,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +24: [2023-04-29 11:26:45,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +24: [2023-04-29 11:26:45,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +14: [2023-04-29 11:26:45,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +23: [2023-04-29 11:26:45,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +23: [2023-04-29 11:26:45,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +34: [2023-04-29 11:26:45,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +15: [2023-04-29 11:26:45,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +15: [2023-04-29 11:26:45,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +26: [2023-04-29 11:26:45,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +26: [2023-04-29 11:26:45,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +26: [2023-04-29 11:26:45,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 1: [2023-04-29 11:26:45,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +26: [2023-04-29 11:26:45,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +14: [2023-04-29 11:26:45,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +21: [2023-04-29 11:26:45,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +58: [2023-04-29 11:26:45,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +15: [2023-04-29 11:26:45,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +25: [2023-04-29 11:26:45,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +58: [2023-04-29 11:26:45,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +26: [2023-04-29 11:26:45,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +58: [2023-04-29 11:26:45,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +58: [2023-04-29 11:26:45,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +24: [2023-04-29 11:26:45,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +24: [2023-04-29 11:26:45,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +26: [2023-04-29 11:26:45,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +58: [2023-04-29 11:26:45,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +58: [2023-04-29 11:26:45,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +58: [2023-04-29 11:26:45,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +34: [2023-04-29 11:26:45,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +20: [2023-04-29 11:26:45,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +20: [2023-04-29 11:26:45,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +20: [2023-04-29 11:26:45,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +20: [2023-04-29 11:26:45,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +26: [2023-04-29 11:26:45,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +14: [2023-04-29 11:26:45,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +58: [2023-04-29 11:26:45,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +26: [2023-04-29 11:26:45,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +14: [2023-04-29 11:26:45,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +26: [2023-04-29 11:26:45,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +11: [2023-04-29 11:26:45,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +25: [2023-04-29 11:26:45,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +14: [2023-04-29 11:26:45,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +26: [2023-04-29 11:26:45,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +20: [2023-04-29 11:26:45,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +20: [2023-04-29 11:26:45,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +30: [2023-04-29 11:26:45,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +24: [2023-04-29 11:26:45,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +26: [2023-04-29 11:26:45,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +20: [2023-04-29 11:26:45,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +20: [2023-04-29 11:26:45,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 5: [2023-04-29 11:26:45,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 5: [2023-04-29 11:26:45,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +48: [2023-04-29 11:26:45,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +48: [2023-04-29 11:26:45,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +24: [2023-04-29 11:26:45,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +24: [2023-04-29 11:26:45,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +50: [2023-04-29 11:26:45,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +63: [2023-04-29 11:26:45,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +63: [2023-04-29 11:26:45,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +21: [2023-04-29 11:26:45,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +21: [2023-04-29 11:26:45,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +16: [2023-04-29 11:26:45,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +26: [2023-04-29 11:26:45,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +63: [2023-04-29 11:26:45,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +24: [2023-04-29 11:26:45,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +26: [2023-04-29 11:26:45,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 6: [2023-04-29 11:26:45,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +50: [2023-04-29 11:26:45,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +63: [2023-04-29 11:26:45,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +16: [2023-04-29 11:26:45,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +16: [2023-04-29 11:26:45,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 5: [2023-04-29 11:26:45,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +16: [2023-04-29 11:26:45,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 3: [2023-04-29 11:26:45,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 6: [2023-04-29 11:26:45,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 5: [2023-04-29 11:26:45,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +30: [2023-04-29 11:26:45,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +11: [2023-04-29 11:26:45,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +26: [2023-04-29 11:26:45,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +16: [2023-04-29 11:26:45,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +30: [2023-04-29 11:26:45,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 11:26:45,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +34: [2023-04-29 11:26:45,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +50: [2023-04-29 11:26:45,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +50: [2023-04-29 11:26:45,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +11: [2023-04-29 11:26:45,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +48: [2023-04-29 11:26:45,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +59: [2023-04-29 11:26:45,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +59: [2023-04-29 11:26:45,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +59: [2023-04-29 11:26:45,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 3: [2023-04-29 11:26:45,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +48: [2023-04-29 11:26:45,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +11: [2023-04-29 11:26:45,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +44: [2023-04-29 11:26:45,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +16: [2023-04-29 11:26:45,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +16: [2023-04-29 11:26:45,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 8: [2023-04-29 11:26:45,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +11: [2023-04-29 11:26:45,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +11: [2023-04-29 11:26:45,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 3: [2023-04-29 11:26:45,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +59: [2023-04-29 11:26:45,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 6: [2023-04-29 11:26:45,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +16: [2023-04-29 11:26:45,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 6: [2023-04-29 11:26:45,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 3: [2023-04-29 11:26:45,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 6: [2023-04-29 11:26:45,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +11: [2023-04-29 11:26:45,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +44: [2023-04-29 11:26:45,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +28: [2023-04-29 11:26:45,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 3: [2023-04-29 11:26:45,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 6: [2023-04-29 11:26:45,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +22: [2023-04-29 11:26:45,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 2: [2023-04-29 11:26:45,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 2: [2023-04-29 11:26:45,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 3: [2023-04-29 11:26:45,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +11: [2023-04-29 11:26:45,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 8: [2023-04-29 11:26:45,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +44: [2023-04-29 11:26:45,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +44: [2023-04-29 11:26:45,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +47: [2023-04-29 11:26:45,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +47: [2023-04-29 11:26:45,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 6: [2023-04-29 11:26:45,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 3: [2023-04-29 11:26:45,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +28: [2023-04-29 11:26:45,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +47: [2023-04-29 11:26:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +47: [2023-04-29 11:26:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +47: [2023-04-29 11:26:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +47: [2023-04-29 11:26:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +47: [2023-04-29 11:26:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +47: [2023-04-29 11:26:45,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +28: [2023-04-29 11:26:45,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +28: [2023-04-29 11:26:45,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 3: [2023-04-29 11:26:45,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +31: [2023-04-29 11:26:45,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +31: [2023-04-29 11:26:45,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +31: [2023-04-29 11:26:45,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +50: [2023-04-29 11:26:45,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +31: [2023-04-29 11:26:45,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 2: [2023-04-29 11:26:45,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 2: [2023-04-29 11:26:45,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +11: [2023-04-29 11:26:45,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +11: [2023-04-29 11:26:45,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +28: [2023-04-29 11:26:45,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 2: [2023-04-29 11:26:45,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 2: [2023-04-29 11:26:45,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +28: [2023-04-29 11:26:45,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 2: [2023-04-29 11:26:45,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +47: [2023-04-29 11:26:45,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +47: [2023-04-29 11:26:45,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +47: [2023-04-29 11:26:45,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +47: [2023-04-29 11:26:45,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +47: [2023-04-29 11:26:45,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 3: [2023-04-29 11:26:45,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 3: [2023-04-29 11:26:45,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +28: [2023-04-29 11:26:45,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +28: [2023-04-29 11:26:45,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +31: [2023-04-29 11:26:45,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +31: [2023-04-29 11:26:45,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +47: [2023-04-29 11:26:45,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +31: [2023-04-29 11:26:45,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +29: [2023-04-29 11:26:45,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +29: [2023-04-29 11:26:45,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +29: [2023-04-29 11:26:45,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +29: [2023-04-29 11:26:45,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +47: [2023-04-29 11:26:45,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +44: [2023-04-29 11:26:45,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +31: [2023-04-29 11:26:45,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +47: [2023-04-29 11:26:45,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +19: [2023-04-29 11:26:45,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +19: [2023-04-29 11:26:45,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 2: [2023-04-29 11:26:45,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 2: [2023-04-29 11:26:45,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 2: [2023-04-29 11:26:45,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +50: [2023-04-29 11:26:45,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +11: [2023-04-29 11:26:45,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +59: [2023-04-29 11:26:45,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +19: [2023-04-29 11:26:45,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +54: [2023-04-29 11:26:45,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +54: [2023-04-29 11:26:45,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +28: [2023-04-29 11:26:45,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +19: [2023-04-29 11:26:45,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +28: [2023-04-29 11:26:45,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +23: [2023-04-29 11:26:45,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +23: [2023-04-29 11:26:45,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 3: [2023-04-29 11:26:45,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 8: [2023-04-29 11:26:45,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +54: [2023-04-29 11:26:45,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +54: [2023-04-29 11:26:45,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 11:26:45,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 3: [2023-04-29 11:26:45,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 5: [2023-04-29 11:26:45,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +50: [2023-04-29 11:26:45,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +59: [2023-04-29 11:26:45,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 5: [2023-04-29 11:26:45,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +59: [2023-04-29 11:26:45,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +28: [2023-04-29 11:26:45,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 5: [2023-04-29 11:26:45,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +54: [2023-04-29 11:26:45,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 3: [2023-04-29 11:26:45,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 5: [2023-04-29 11:26:45,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +54: [2023-04-29 11:26:45,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +54: [2023-04-29 11:26:45,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +22: [2023-04-29 11:26:45,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +22: [2023-04-29 11:26:45,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +54: [2023-04-29 11:26:45,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +44: [2023-04-29 11:26:45,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +23: [2023-04-29 11:26:45,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +23: [2023-04-29 11:26:45,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +22: [2023-04-29 11:26:45,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +30: [2023-04-29 11:26:45,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +30: [2023-04-29 11:26:45,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 8: [2023-04-29 11:26:45,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +20: [2023-04-29 11:26:45,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +30: [2023-04-29 11:26:45,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +28: [2023-04-29 11:26:45,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +30: [2023-04-29 11:26:45,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +44: [2023-04-29 11:26:45,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +22: [2023-04-29 11:26:45,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +20: [2023-04-29 11:26:45,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 2: [2023-04-29 11:26:45,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +41: [2023-04-29 11:26:45,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +41: [2023-04-29 11:26:45,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +26: [2023-04-29 11:26:45,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +14: [2023-04-29 11:26:45,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +41: [2023-04-29 11:26:45,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +41: [2023-04-29 11:26:45,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +41: [2023-04-29 11:26:45,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +41: [2023-04-29 11:26:45,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +41: [2023-04-29 11:26:45,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +41: [2023-04-29 11:26:45,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +23: [2023-04-29 11:26:45,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +23: [2023-04-29 11:26:45,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +20: [2023-04-29 11:26:45,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +20: [2023-04-29 11:26:45,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +38: [2023-04-29 11:26:45,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +59: [2023-04-29 11:26:45,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +38: [2023-04-29 11:26:45,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +38: [2023-04-29 11:26:45,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +38: [2023-04-29 11:26:45,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +38: [2023-04-29 11:26:45,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +38: [2023-04-29 11:26:45,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +38: [2023-04-29 11:26:45,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +58: [2023-04-29 11:26:45,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +28: [2023-04-29 11:26:45,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +38: [2023-04-29 11:26:45,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 1: [2023-04-29 11:26:45,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 3: [2023-04-29 11:26:45,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +44: [2023-04-29 11:26:45,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +41: [2023-04-29 11:26:45,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +28: [2023-04-29 11:26:45,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +58: [2023-04-29 11:26:45,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +41: [2023-04-29 11:26:45,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +41: [2023-04-29 11:26:45,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +41: [2023-04-29 11:26:45,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +26: [2023-04-29 11:26:45,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +41: [2023-04-29 11:26:45,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 1: [2023-04-29 11:26:45,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +23: [2023-04-29 11:26:45,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 4: [2023-04-29 11:26:45,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +38: [2023-04-29 11:26:45,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +58: [2023-04-29 11:26:45,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +23: [2023-04-29 11:26:45,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +41: [2023-04-29 11:26:45,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +38: [2023-04-29 11:26:45,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +38: [2023-04-29 11:26:45,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +41: [2023-04-29 11:26:45,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +26: [2023-04-29 11:26:45,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +58: [2023-04-29 11:26:45,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +41: [2023-04-29 11:26:45,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... + 2: [2023-04-29 11:26:45,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 1: [2023-04-29 11:26:45,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +38: [2023-04-29 11:26:45,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +38: [2023-04-29 11:26:45,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +26: [2023-04-29 11:26:45,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +38: [2023-04-29 11:26:45,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +38: [2023-04-29 11:26:45,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +14: [2023-04-29 11:26:45,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +38: [2023-04-29 11:26:45,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +11: [2023-04-29 11:26:45,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 3: [2023-04-29 11:26:45,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 1: [2023-04-29 11:26:45,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 1: [2023-04-29 11:26:45,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +29: [2023-04-29 11:26:45,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +14: [2023-04-29 11:26:45,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +14: [2023-04-29 11:26:45,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +11: [2023-04-29 11:26:45,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +63: [2023-04-29 11:26:45,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +29: [2023-04-29 11:26:45,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +29: [2023-04-29 11:26:45,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +42: [2023-04-29 11:26:45,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +42: [2023-04-29 11:26:45,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +42: [2023-04-29 11:26:45,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +42: [2023-04-29 11:26:45,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +42: [2023-04-29 11:26:45,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +42: [2023-04-29 11:26:45,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +42: [2023-04-29 11:26:45,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +42: [2023-04-29 11:26:45,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +29: [2023-04-29 11:26:45,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +19: [2023-04-29 11:26:45,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +46: [2023-04-29 11:26:45,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +46: [2023-04-29 11:26:45,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +19: [2023-04-29 11:26:45,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +19: [2023-04-29 11:26:45,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +63: [2023-04-29 11:26:45,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +63: [2023-04-29 11:26:45,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 8: [2023-04-29 11:26:45,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +46: [2023-04-29 11:26:45,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +46: [2023-04-29 11:26:45,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +20: [2023-04-29 11:26:45,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +46: [2023-04-29 11:26:45,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +46: [2023-04-29 11:26:45,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +46: [2023-04-29 11:26:45,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +46: [2023-04-29 11:26:45,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +28: [2023-04-29 11:26:45,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +19: [2023-04-29 11:26:45,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +42: [2023-04-29 11:26:45,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +42: [2023-04-29 11:26:45,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +42: [2023-04-29 11:26:45,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +11: [2023-04-29 11:26:45,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +63: [2023-04-29 11:26:45,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +63: [2023-04-29 11:26:45,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +20: [2023-04-29 11:26:45,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +42: [2023-04-29 11:26:45,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... + 5: [2023-04-29 11:26:45,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +42: [2023-04-29 11:26:45,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... + 5: [2023-04-29 11:26:45,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +17: [2023-04-29 11:26:45,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +17: [2023-04-29 11:26:45,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +42: [2023-04-29 11:26:45,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +42: [2023-04-29 11:26:45,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +10: [2023-04-29 11:26:45,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +10: [2023-04-29 11:26:45,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +10: [2023-04-29 11:26:45,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 5: [2023-04-29 11:26:45,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +10: [2023-04-29 11:26:45,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +30: [2023-04-29 11:26:45,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +46: [2023-04-29 11:26:45,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +14: [2023-04-29 11:26:45,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +26: [2023-04-29 11:26:45,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +46: [2023-04-29 11:26:45,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +17: [2023-04-29 11:26:45,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +46: [2023-04-29 11:26:45,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +63: [2023-04-29 11:26:45,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +46: [2023-04-29 11:26:45,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... + 5: [2023-04-29 11:26:45,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +22: [2023-04-29 11:26:45,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +17: [2023-04-29 11:26:45,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 3: [2023-04-29 11:26:45,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 2: [2023-04-29 11:26:45,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +42: [2023-04-29 11:26:45,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 8: [2023-04-29 11:26:45,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +46: [2023-04-29 11:26:45,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +30: [2023-04-29 11:26:45,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +46: [2023-04-29 11:26:45,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +30: [2023-04-29 11:26:45,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +46: [2023-04-29 11:26:45,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +46: [2023-04-29 11:26:45,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +28: [2023-04-29 11:26:45,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 11:26:45,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +10: [2023-04-29 11:26:45,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +22: [2023-04-29 11:26:45,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +10: [2023-04-29 11:26:45,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +54: [2023-04-29 11:26:45,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +54: [2023-04-29 11:26:45,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +30: [2023-04-29 11:26:45,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +63: [2023-04-29 11:26:45,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +58: [2023-04-29 11:26:45,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +63: [2023-04-29 11:26:45,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +54: [2023-04-29 11:26:45,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +57: [2023-04-29 11:26:45,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +57: [2023-04-29 11:26:45,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 11:26:45,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +20: [2023-04-29 11:26:45,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +10: [2023-04-29 11:26:45,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +10: [2023-04-29 11:26:45,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +58: [2023-04-29 11:26:45,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +57: [2023-04-29 11:26:45,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +57: [2023-04-29 11:26:45,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +57: [2023-04-29 11:26:45,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +57: [2023-04-29 11:26:45,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +57: [2023-04-29 11:26:45,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +58: [2023-04-29 11:26:45,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +22: [2023-04-29 11:26:45,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +57: [2023-04-29 11:26:45,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +58: [2023-04-29 11:26:45,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +26: [2023-04-29 11:26:45,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 2: [2023-04-29 11:26:45,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +57: [2023-04-29 11:26:45,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +57: [2023-04-29 11:26:45,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +47: [2023-04-29 11:26:45,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +57: [2023-04-29 11:26:45,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +57: [2023-04-29 11:26:45,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +26: [2023-04-29 11:26:45,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +26: [2023-04-29 11:26:45,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +57: [2023-04-29 11:26:45,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +57: [2023-04-29 11:26:45,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +52: [2023-04-29 11:26:45,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +52: [2023-04-29 11:26:45,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +27: [2023-04-29 11:26:45,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +27: [2023-04-29 11:26:45,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +57: [2023-04-29 11:26:45,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +57: [2023-04-29 11:26:45,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +52: [2023-04-29 11:26:45,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +52: [2023-04-29 11:26:45,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +52: [2023-04-29 11:26:45,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +52: [2023-04-29 11:26:45,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +52: [2023-04-29 11:26:45,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +14: [2023-04-29 11:26:45,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +52: [2023-04-29 11:26:45,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +27: [2023-04-29 11:26:45,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +14: [2023-04-29 11:26:45,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +27: [2023-04-29 11:26:45,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +14: [2023-04-29 11:26:45,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +43: [2023-04-29 11:26:45,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +43: [2023-04-29 11:26:45,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +43: [2023-04-29 11:26:45,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +43: [2023-04-29 11:26:45,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +52: [2023-04-29 11:26:45,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +52: [2023-04-29 11:26:45,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +52: [2023-04-29 11:26:45,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +52: [2023-04-29 11:26:45,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +52: [2023-04-29 11:26:45,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +47: [2023-04-29 11:26:45,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +47: [2023-04-29 11:26:45,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +52: [2023-04-29 11:26:45,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +52: [2023-04-29 11:26:45,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +43: [2023-04-29 11:26:45,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +17: [2023-04-29 11:26:45,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +43: [2023-04-29 11:26:45,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +17: [2023-04-29 11:26:45,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 11:26:45,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 9: [2023-04-29 11:26:45,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +47: [2023-04-29 11:26:45,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +52: [2023-04-29 11:26:45,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +43: [2023-04-29 11:26:45,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +31: [2023-04-29 11:26:45,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +31: [2023-04-29 11:26:45,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +31: [2023-04-29 11:26:45,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +43: [2023-04-29 11:26:45,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 9: [2023-04-29 11:26:45,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +17: [2023-04-29 11:26:45,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +54: [2023-04-29 11:26:45,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +54: [2023-04-29 11:26:45,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +54: [2023-04-29 11:26:45,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +38: [2023-04-29 11:26:45,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 11:26:45,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +31: [2023-04-29 11:26:45,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +56: [2023-04-29 11:26:45,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +56: [2023-04-29 11:26:45,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +56: [2023-04-29 11:26:45,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +56: [2023-04-29 11:26:45,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +56: [2023-04-29 11:26:45,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +56: [2023-04-29 11:26:45,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +56: [2023-04-29 11:26:45,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +56: [2023-04-29 11:26:45,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +54: [2023-04-29 11:26:45,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +47: [2023-04-29 11:26:45,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +41: [2023-04-29 11:26:45,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +41: [2023-04-29 11:26:45,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +55: [2023-04-29 11:26:45,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +55: [2023-04-29 11:26:45,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +38: [2023-04-29 11:26:45,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +29: [2023-04-29 11:26:45,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +55: [2023-04-29 11:26:45,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +54: [2023-04-29 11:26:45,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +55: [2023-04-29 11:26:45,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +60: [2023-04-29 11:26:45,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +60: [2023-04-29 11:26:45,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +31: [2023-04-29 11:26:45,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +31: [2023-04-29 11:26:45,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +31: [2023-04-29 11:26:45,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +51: [2023-04-29 11:26:45,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +51: [2023-04-29 11:26:45,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +42: [2023-04-29 11:26:45,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +39: [2023-04-29 11:26:45,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +39: [2023-04-29 11:26:45,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +41: [2023-04-29 11:26:45,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +41: [2023-04-29 11:26:45,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 11:26:45,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +62: [2023-04-29 11:26:45,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +31: [2023-04-29 11:26:45,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 5: [2023-04-29 11:26:45,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +51: [2023-04-29 11:26:45,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +14: [2023-04-29 11:26:45,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +14: [2023-04-29 11:26:45,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +14: [2023-04-29 11:26:45,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +27: [2023-04-29 11:26:45,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +14: [2023-04-29 11:26:45,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +51: [2023-04-29 11:26:45,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +29: [2023-04-29 11:26:45,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +27: [2023-04-29 11:26:45,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +55: [2023-04-29 11:26:45,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +29: [2023-04-29 11:26:45,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +55: [2023-04-29 11:26:45,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +55: [2023-04-29 11:26:45,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +55: [2023-04-29 11:26:45,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +62: [2023-04-29 11:26:45,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +27: [2023-04-29 11:26:45,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +27: [2023-04-29 11:26:45,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +54: [2023-04-29 11:26:45,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +62: [2023-04-29 11:26:45,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +39: [2023-04-29 11:26:45,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +51: [2023-04-29 11:26:45,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +39: [2023-04-29 11:26:45,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +60: [2023-04-29 11:26:45,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +60: [2023-04-29 11:26:45,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 5: [2023-04-29 11:26:45,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +51: [2023-04-29 11:26:45,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 4: [2023-04-29 11:26:45,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 4: [2023-04-29 11:26:45,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +38: [2023-04-29 11:26:45,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +51: [2023-04-29 11:26:45,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +29: [2023-04-29 11:26:45,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +39: [2023-04-29 11:26:45,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +51: [2023-04-29 11:26:45,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +39: [2023-04-29 11:26:45,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +62: [2023-04-29 11:26:45,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +62: [2023-04-29 11:26:45,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +38: [2023-04-29 11:26:45,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +60: [2023-04-29 11:26:45,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +62: [2023-04-29 11:26:45,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +60: [2023-04-29 11:26:45,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +46: [2023-04-29 11:26:45,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +22: [2023-04-29 11:26:45,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +22: [2023-04-29 11:26:45,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +22: [2023-04-29 11:26:45,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +22: [2023-04-29 11:26:45,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +62: [2023-04-29 11:26:45,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +54: [2023-04-29 11:26:45,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +39: [2023-04-29 11:26:45,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +29: [2023-04-29 11:26:45,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +39: [2023-04-29 11:26:45,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +60: [2023-04-29 11:26:45,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +30: [2023-04-29 11:26:45,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +42: [2023-04-29 11:26:45,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +47: [2023-04-29 11:26:45,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +47: [2023-04-29 11:26:45,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +31: [2023-04-29 11:26:45,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +31: [2023-04-29 11:26:45,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +31: [2023-04-29 11:26:45,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +60: [2023-04-29 11:26:45,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +46: [2023-04-29 11:26:45,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +46: [2023-04-29 11:26:45,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +29: [2023-04-29 11:26:45,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +29: [2023-04-29 11:26:45,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +38: [2023-04-29 11:26:45,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +30: [2023-04-29 11:26:45,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +47: [2023-04-29 11:26:45,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 5: [2023-04-29 11:26:45,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +10: [2023-04-29 11:26:45,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 5: [2023-04-29 11:26:45,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +35: [2023-04-29 11:26:45,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +35: [2023-04-29 11:26:45,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +35: [2023-04-29 11:26:45,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +35: [2023-04-29 11:26:45,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +30: [2023-04-29 11:26:45,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 11:26:45,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +18: [2023-04-29 11:26:45,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +35: [2023-04-29 11:26:45,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +35: [2023-04-29 11:26:45,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +35: [2023-04-29 11:26:45,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +35: [2023-04-29 11:26:45,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 6: [2023-04-29 11:26:45,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 6: [2023-04-29 11:26:45,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +18: [2023-04-29 11:26:45,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +18: [2023-04-29 11:26:45,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +30: [2023-04-29 11:26:45,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 6: [2023-04-29 11:26:45,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 6: [2023-04-29 11:26:45,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +31: [2023-04-29 11:26:45,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +54: [2023-04-29 11:26:45,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +29: [2023-04-29 11:26:45,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +10: [2023-04-29 11:26:45,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 5: [2023-04-29 11:26:45,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +62: [2023-04-29 11:26:45,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +62: [2023-04-29 11:26:45,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +62: [2023-04-29 11:26:45,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +62: [2023-04-29 11:26:45,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +41: [2023-04-29 11:26:45,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +57: [2023-04-29 11:26:45,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +38: [2023-04-29 11:26:45,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +61: [2023-04-29 11:26:45,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +61: [2023-04-29 11:26:45,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +61: [2023-04-29 11:26:45,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +30: [2023-04-29 11:26:45,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +61: [2023-04-29 11:26:45,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. + 5: [2023-04-29 11:26:45,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... + 5: [2023-04-29 11:26:45,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +41: [2023-04-29 11:26:45,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +54: [2023-04-29 11:26:45,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +14: [2023-04-29 11:26:45,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +35: [2023-04-29 11:26:45,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +35: [2023-04-29 11:26:45,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +35: [2023-04-29 11:26:45,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +35: [2023-04-29 11:26:45,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... + 6: [2023-04-29 11:26:45,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +30: [2023-04-29 11:26:45,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +35: [2023-04-29 11:26:45,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +42: [2023-04-29 11:26:45,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +42: [2023-04-29 11:26:45,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +30: [2023-04-29 11:26:45,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +41: [2023-04-29 11:26:45,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +41: [2023-04-29 11:26:45,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +46: [2023-04-29 11:26:45,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +14: [2023-04-29 11:26:45,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +14: [2023-04-29 11:26:45,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +31: [2023-04-29 11:26:45,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +54: [2023-04-29 11:26:45,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +35: [2023-04-29 11:26:45,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +35: [2023-04-29 11:26:45,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... + 5: [2023-04-29 11:26:45,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +13: [2023-04-29 11:26:45,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +13: [2023-04-29 11:26:45,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +13: [2023-04-29 11:26:45,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +13: [2023-04-29 11:26:45,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +35: [2023-04-29 11:26:45,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +31: [2023-04-29 11:26:45,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +31: [2023-04-29 11:26:45,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +14: [2023-04-29 11:26:45,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +30: [2023-04-29 11:26:45,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +31: [2023-04-29 11:26:45,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +10: [2023-04-29 11:26:45,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +38: [2023-04-29 11:26:45,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +38: [2023-04-29 11:26:45,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +46: [2023-04-29 11:26:45,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +42: [2023-04-29 11:26:45,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +22: [2023-04-29 11:26:45,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +22: [2023-04-29 11:26:45,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +57: [2023-04-29 11:26:45,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +57: [2023-04-29 11:26:45,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +57: [2023-04-29 11:26:45,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +17: [2023-04-29 11:26:45,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +46: [2023-04-29 11:26:45,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +10: [2023-04-29 11:26:45,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +43: [2023-04-29 11:26:45,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +43: [2023-04-29 11:26:45,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +52: [2023-04-29 11:26:45,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +52: [2023-04-29 11:26:45,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +46: [2023-04-29 11:26:45,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +42: [2023-04-29 11:26:45,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +54: [2023-04-29 11:26:45,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +10: [2023-04-29 11:26:45,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +17: [2023-04-29 11:26:45,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +43: [2023-04-29 11:26:45,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +43: [2023-04-29 11:26:45,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +22: [2023-04-29 11:26:45,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +22: [2023-04-29 11:26:45,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +17: [2023-04-29 11:26:45,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +17: [2023-04-29 11:26:45,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +10: [2023-04-29 11:26:45,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +25: [2023-04-29 11:26:45,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +25: [2023-04-29 11:26:45,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +25: [2023-04-29 11:26:45,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +25: [2023-04-29 11:26:45,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +61: [2023-04-29 11:26:45,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +52: [2023-04-29 11:26:45,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +18: [2023-04-29 11:26:45,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +18: [2023-04-29 11:26:45,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +18: [2023-04-29 11:26:45,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +17: [2023-04-29 11:26:45,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +62: [2023-04-29 11:26:45,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +18: [2023-04-29 11:26:45,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +57: [2023-04-29 11:26:45,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +52: [2023-04-29 11:26:45,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +62: [2023-04-29 11:26:45,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +17: [2023-04-29 11:26:45,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +56: [2023-04-29 11:26:45,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +61: [2023-04-29 11:26:45,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +62: [2023-04-29 11:26:45,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +17: [2023-04-29 11:26:45,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +62: [2023-04-29 11:26:45,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +17: [2023-04-29 11:26:45,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +61: [2023-04-29 11:26:45,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +61: [2023-04-29 11:26:45,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +46: [2023-04-29 11:26:45,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +54: [2023-04-29 11:26:45,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +56: [2023-04-29 11:26:45,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 11:26:45,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +42: [2023-04-29 11:26:45,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +56: [2023-04-29 11:26:45,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +56: [2023-04-29 11:26:45,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +54: [2023-04-29 11:26:45,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +36: [2023-04-29 11:26:45,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +36: [2023-04-29 11:26:45,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +36: [2023-04-29 11:26:45,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +36: [2023-04-29 11:26:45,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +10: [2023-04-29 11:26:45,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +54: [2023-04-29 11:26:45,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +13: [2023-04-29 11:26:45,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +57: [2023-04-29 11:26:45,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +57: [2023-04-29 11:26:45,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +13: [2023-04-29 11:26:45,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +13: [2023-04-29 11:26:45,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +55: [2023-04-29 11:26:45,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +55: [2023-04-29 11:26:45,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +43: [2023-04-29 11:26:45,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +12: [2023-04-29 11:26:45,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +12: [2023-04-29 11:26:45,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +51: [2023-04-29 11:26:45,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +36: [2023-04-29 11:26:45,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +36: [2023-04-29 11:26:45,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +19: [2023-04-29 11:26:45,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +19: [2023-04-29 11:26:45,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +36: [2023-04-29 11:26:45,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +12: [2023-04-29 11:26:45,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +13: [2023-04-29 11:26:45,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +12: [2023-04-29 11:26:45,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +43: [2023-04-29 11:26:45,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +52: [2023-04-29 11:26:45,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +52: [2023-04-29 11:26:45,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +57: [2023-04-29 11:26:45,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +36: [2023-04-29 11:26:45,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +42: [2023-04-29 11:26:45,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +19: [2023-04-29 11:26:45,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +49: [2023-04-29 11:26:45,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +49: [2023-04-29 11:26:45,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +49: [2023-04-29 11:26:45,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +49: [2023-04-29 11:26:45,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +49: [2023-04-29 11:26:45,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +49: [2023-04-29 11:26:45,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +49: [2023-04-29 11:26:45,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +49: [2023-04-29 11:26:45,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +19: [2023-04-29 11:26:45,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +54: [2023-04-29 11:26:45,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +54: [2023-04-29 11:26:45,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +51: [2023-04-29 11:26:45,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +10: [2023-04-29 11:26:45,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +55: [2023-04-29 11:26:45,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +55: [2023-04-29 11:26:45,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +27: [2023-04-29 11:26:45,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +43: [2023-04-29 11:26:45,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +43: [2023-04-29 11:26:45,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +49: [2023-04-29 11:26:45,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +49: [2023-04-29 11:26:45,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +49: [2023-04-29 11:26:45,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +39: [2023-04-29 11:26:45,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +49: [2023-04-29 11:26:45,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +60: [2023-04-29 11:26:45,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +60: [2023-04-29 11:26:45,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +27: [2023-04-29 11:26:45,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +27: [2023-04-29 11:26:45,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +54: [2023-04-29 11:26:45,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... + 9: [2023-04-29 11:26:45,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 9: [2023-04-29 11:26:45,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +54: [2023-04-29 11:26:45,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +52: [2023-04-29 11:26:45,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +60: [2023-04-29 11:26:45,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +39: [2023-04-29 11:26:45,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +20: [2023-04-29 11:26:45,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +20: [2023-04-29 11:26:45,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +49: [2023-04-29 11:26:45,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +20: [2023-04-29 11:26:45,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +20: [2023-04-29 11:26:45,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_09-model_01-model_states.pt. +56: [2023-04-29 11:26:45,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +52: [2023-04-29 11:26:45,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +49: [2023-04-29 11:26:45,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +25: [2023-04-29 11:26:45,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +27: [2023-04-29 11:26:45,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +49: [2023-04-29 11:26:45,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +27: [2023-04-29 11:26:45,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +14: [2023-04-29 11:26:45,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +51: [2023-04-29 11:26:45,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +62: [2023-04-29 11:26:45,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +39: [2023-04-29 11:26:45,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +39: [2023-04-29 11:26:45,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +49: [2023-04-29 11:26:45,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +51: [2023-04-29 11:26:45,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +27: [2023-04-29 11:26:45,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 9: [2023-04-29 11:26:45,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +56: [2023-04-29 11:26:45,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +27: [2023-04-29 11:26:45,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +25: [2023-04-29 11:26:45,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +25: [2023-04-29 11:26:45,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +25: [2023-04-29 11:26:45,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +62: [2023-04-29 11:26:45,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +14: [2023-04-29 11:26:45,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 9: [2023-04-29 11:26:45,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 9: [2023-04-29 11:26:45,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +27: [2023-04-29 11:26:45,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 6: [2023-04-29 11:26:45,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +56: [2023-04-29 11:26:45,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +56: [2023-04-29 11:26:45,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 9: [2023-04-29 11:26:45,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 9: [2023-04-29 11:26:45,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 6: [2023-04-29 11:26:45,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +62: [2023-04-29 11:26:45,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +31: [2023-04-29 11:26:45,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +35: [2023-04-29 11:26:45,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +60: [2023-04-29 11:26:45,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +21: [2023-04-29 11:26:45,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +21: [2023-04-29 11:26:45,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +21: [2023-04-29 11:26:45,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +21: [2023-04-29 11:26:45,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +62: [2023-04-29 11:26:45,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +12: [2023-04-29 11:26:45,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 3: [2023-04-29 11:26:45,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +51: [2023-04-29 11:26:45,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 3: [2023-04-29 11:26:45,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 3: [2023-04-29 11:26:45,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +12: [2023-04-29 11:26:45,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +55: [2023-04-29 11:26:45,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 3: [2023-04-29 11:26:45,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +31: [2023-04-29 11:26:45,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +14: [2023-04-29 11:26:45,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +12: [2023-04-29 11:26:45,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +55: [2023-04-29 11:26:45,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +55: [2023-04-29 11:26:45,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +55: [2023-04-29 11:26:45,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +35: [2023-04-29 11:26:45,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +35: [2023-04-29 11:26:45,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +19: [2023-04-29 11:26:45,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +19: [2023-04-29 11:26:45,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +22: [2023-04-29 11:26:45,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +19: [2023-04-29 11:26:45,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +14: [2023-04-29 11:26:45,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +39: [2023-04-29 11:26:45,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +31: [2023-04-29 11:26:45,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +31: [2023-04-29 11:26:45,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +31: [2023-04-29 11:26:45,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +51: [2023-04-29 11:26:45,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +12: [2023-04-29 11:26:45,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +14: [2023-04-29 11:26:45,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +14: [2023-04-29 11:26:45,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 6: [2023-04-29 11:26:45,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 6: [2023-04-29 11:26:45,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +19: [2023-04-29 11:26:45,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +10: [2023-04-29 11:26:45,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +10: [2023-04-29 11:26:45,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +10: [2023-04-29 11:26:45,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 6: [2023-04-29 11:26:45,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +35: [2023-04-29 11:26:45,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +10: [2023-04-29 11:26:45,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +22: [2023-04-29 11:26:45,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 0: [2023-04-29 11:26:45,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +39: [2023-04-29 11:26:45,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 6: [2023-04-29 11:26:45,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +60: [2023-04-29 11:26:45,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +60: [2023-04-29 11:26:45,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +20: [2023-04-29 11:26:45,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +20: [2023-04-29 11:26:45,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... +14: [2023-04-29 11:26:45,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 7: [2023-04-29 11:26:45,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 11:26:45,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +11: [2023-04-29 11:26:45,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +11: [2023-04-29 11:26:45,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +11: [2023-04-29 11:26:45,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 7: [2023-04-29 11:26:45,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +31: [2023-04-29 11:26:45,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +31: [2023-04-29 11:26:45,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +39: [2023-04-29 11:26:45,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +11: [2023-04-29 11:26:45,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +62: [2023-04-29 11:26:45,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +14: [2023-04-29 11:26:45,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +31: [2023-04-29 11:26:45,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +39: [2023-04-29 11:26:45,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +63: [2023-04-29 11:26:45,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +63: [2023-04-29 11:26:45,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +63: [2023-04-29 11:26:45,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +62: [2023-04-29 11:26:45,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +22: [2023-04-29 11:26:45,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +63: [2023-04-29 11:26:45,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +51: [2023-04-29 11:26:45,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +22: [2023-04-29 11:26:45,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 4: [2023-04-29 11:26:45,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +51: [2023-04-29 11:26:45,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +20: [2023-04-29 11:26:45,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 7: [2023-04-29 11:26:45,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 11:26:45,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +60: [2023-04-29 11:26:45,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 7: [2023-04-29 11:26:45,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 7: [2023-04-29 11:26:45,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +22: [2023-04-29 11:26:45,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 7: [2023-04-29 11:26:45,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +63: [2023-04-29 11:26:45,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +22: [2023-04-29 11:26:45,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 4: [2023-04-29 11:26:45,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +63: [2023-04-29 11:26:45,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +63: [2023-04-29 11:26:45,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +62: [2023-04-29 11:26:45,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +63: [2023-04-29 11:26:45,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +22: [2023-04-29 11:26:45,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +15: [2023-04-29 11:26:45,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +35: [2023-04-29 11:26:45,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +15: [2023-04-29 11:26:45,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +15: [2023-04-29 11:26:45,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +15: [2023-04-29 11:26:45,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +28: [2023-04-29 11:26:45,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +28: [2023-04-29 11:26:45,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +21: [2023-04-29 11:26:45,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 4: [2023-04-29 11:26:45,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +62: [2023-04-29 11:26:45,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +28: [2023-04-29 11:26:45,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +28: [2023-04-29 11:26:45,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +60: [2023-04-29 11:26:45,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +22: [2023-04-29 11:26:45,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 3: [2023-04-29 11:26:45,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +21: [2023-04-29 11:26:45,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +21: [2023-04-29 11:26:45,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +21: [2023-04-29 11:26:45,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 3: [2023-04-29 11:26:45,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 0: [2023-04-29 11:26:45,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +10: [2023-04-29 11:26:45,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +36: [2023-04-29 11:26:45,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 11:26:45,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +62: [2023-04-29 11:26:45,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 11:26:45,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +62: [2023-04-29 11:26:45,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 3: [2023-04-29 11:26:45,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +11: [2023-04-29 11:26:45,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 7: [2023-04-29 11:26:45,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 7: [2023-04-29 11:26:45,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 7: [2023-04-29 11:26:45,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 7: [2023-04-29 11:26:45,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +32: [2023-04-29 11:26:45,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +32: [2023-04-29 11:26:45,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. + 6: [2023-04-29 11:26:45,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +32: [2023-04-29 11:26:45,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +10: [2023-04-29 11:26:45,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +32: [2023-04-29 11:26:45,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +62: [2023-04-29 11:26:45,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +62: [2023-04-29 11:26:45,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 3: [2023-04-29 11:26:45,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +62: [2023-04-29 11:26:45,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +10: [2023-04-29 11:26:45,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +10: [2023-04-29 11:26:45,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +49: [2023-04-29 11:26:45,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +13: [2023-04-29 11:26:45,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +13: [2023-04-29 11:26:45,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 0: [2023-04-29 11:26:45,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 11:26:45,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +35: [2023-04-29 11:26:46,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +13: [2023-04-29 11:26:46,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +62: [2023-04-29 11:26:46,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +11: [2023-04-29 11:26:46,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +62: [2023-04-29 11:26:46,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +62: [2023-04-29 11:26:46,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +36: [2023-04-29 11:26:46,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +36: [2023-04-29 11:26:46,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +36: [2023-04-29 11:26:46,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +13: [2023-04-29 11:26:46,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +25: [2023-04-29 11:26:46,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +11: [2023-04-29 11:26:46,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +13: [2023-04-29 11:26:46,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +13: [2023-04-29 11:26:46,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +11: [2023-04-29 11:26:46,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +13: [2023-04-29 11:26:46,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +15: [2023-04-29 11:26:46,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +13: [2023-04-29 11:26:46,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +25: [2023-04-29 11:26:46,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +25: [2023-04-29 11:26:46,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +25: [2023-04-29 11:26:46,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +25: [2023-04-29 11:26:46,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +49: [2023-04-29 11:26:46,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +49: [2023-04-29 11:26:46,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +15: [2023-04-29 11:26:46,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +60: [2023-04-29 11:26:46,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +60: [2023-04-29 11:26:46,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +60: [2023-04-29 11:26:46,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +60: [2023-04-29 11:26:46,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +49: [2023-04-29 11:26:46,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +28: [2023-04-29 11:26:46,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +28: [2023-04-29 11:26:46,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +28: [2023-04-29 11:26:46,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +28: [2023-04-29 11:26:46,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +25: [2023-04-29 11:26:46,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +36: [2023-04-29 11:26:46,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +15: [2023-04-29 11:26:46,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +25: [2023-04-29 11:26:46,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +15: [2023-04-29 11:26:46,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +25: [2023-04-29 11:26:46,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 1: [2023-04-29 11:26:46,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 7: [2023-04-29 11:26:46,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +49: [2023-04-29 11:26:46,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +19: [2023-04-29 11:26:46,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +24: [2023-04-29 11:26:46,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +24: [2023-04-29 11:26:46,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +24: [2023-04-29 11:26:46,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +24: [2023-04-29 11:26:46,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 11:26:46,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 11:26:46,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 11:26:46,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +20: [2023-04-29 11:26:46,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +16: [2023-04-29 11:26:46,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +19: [2023-04-29 11:26:46,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +19: [2023-04-29 11:26:46,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +24: [2023-04-29 11:26:46,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +36: [2023-04-29 11:26:46,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +24: [2023-04-29 11:26:46,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 11:26:46,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +29: [2023-04-29 11:26:46,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +29: [2023-04-29 11:26:46,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +29: [2023-04-29 11:26:46,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +36: [2023-04-29 11:26:46,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +19: [2023-04-29 11:26:46,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +20: [2023-04-29 11:26:46,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +24: [2023-04-29 11:26:46,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 11:26:46,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +29: [2023-04-29 11:26:46,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 11:26:46,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +24: [2023-04-29 11:26:46,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +16: [2023-04-29 11:26:46,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +19: [2023-04-29 11:26:46,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +36: [2023-04-29 11:26:46,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +16: [2023-04-29 11:26:46,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 11:26:46,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +16: [2023-04-29 11:26:46,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 11:26:46,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +19: [2023-04-29 11:26:46,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +29: [2023-04-29 11:26:46,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +29: [2023-04-29 11:26:46,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +29: [2023-04-29 11:26:46,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +32: [2023-04-29 11:26:46,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +29: [2023-04-29 11:26:46,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +60: [2023-04-29 11:26:46,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +19: [2023-04-29 11:26:46,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +49: [2023-04-29 11:26:46,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +53: [2023-04-29 11:26:46,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +53: [2023-04-29 11:26:46,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +53: [2023-04-29 11:26:46,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +60: [2023-04-29 11:26:46,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +53: [2023-04-29 11:26:46,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +60: [2023-04-29 11:26:46,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +60: [2023-04-29 11:26:46,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +63: [2023-04-29 11:26:46,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 11:26:46,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +21: [2023-04-29 11:26:46,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +49: [2023-04-29 11:26:46,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +32: [2023-04-29 11:26:46,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +19: [2023-04-29 11:26:46,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +20: [2023-04-29 11:26:46,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_00-model_states.pt. +49: [2023-04-29 11:26:46,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +18: [2023-04-29 11:26:46,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +18: [2023-04-29 11:26:46,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +18: [2023-04-29 11:26:46,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +18: [2023-04-29 11:26:46,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +18: [2023-04-29 11:26:46,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +18: [2023-04-29 11:26:46,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +18: [2023-04-29 11:26:46,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +18: [2023-04-29 11:26:46,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +63: [2023-04-29 11:26:46,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +63: [2023-04-29 11:26:46,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +63: [2023-04-29 11:26:46,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 11:26:46,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +21: [2023-04-29 11:26:46,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +18: [2023-04-29 11:26:46,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +24: [2023-04-29 11:26:46,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +24: [2023-04-29 11:26:46,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +24: [2023-04-29 11:26:46,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +24: [2023-04-29 11:26:46,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +20: [2023-04-29 11:26:46,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt... +18: [2023-04-29 11:26:46,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 11:26:46,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +18: [2023-04-29 11:26:46,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +10: [2023-04-29 11:26:46,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +21: [2023-04-29 11:26:46,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 11:26:46,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +18: [2023-04-29 11:26:46,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 0: [2023-04-29 11:26:46,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 0: [2023-04-29 11:26:46,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +21: [2023-04-29 11:26:46,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +18: [2023-04-29 11:26:46,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +18: [2023-04-29 11:26:46,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 0: [2023-04-29 11:26:46,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 3: [2023-04-29 11:26:46,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 3: [2023-04-29 11:26:46,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +10: [2023-04-29 11:26:46,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +11: [2023-04-29 11:26:46,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 11:26:46,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +21: [2023-04-29 11:26:46,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 3: [2023-04-29 11:26:46,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +21: [2023-04-29 11:26:46,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 6: [2023-04-29 11:26:46,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +28: [2023-04-29 11:26:46,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +11: [2023-04-29 11:26:46,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +63: [2023-04-29 11:26:46,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +10: [2023-04-29 11:26:46,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +21: [2023-04-29 11:26:46,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +53: [2023-04-29 11:26:46,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +53: [2023-04-29 11:26:46,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +28: [2023-04-29 11:26:46,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 6: [2023-04-29 11:26:46,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +10: [2023-04-29 11:26:46,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +10: [2023-04-29 11:26:46,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +53: [2023-04-29 11:26:46,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +53: [2023-04-29 11:26:46,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 3: [2023-04-29 11:26:46,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 7: [2023-04-29 11:26:46,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +24: [2023-04-29 11:26:46,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +28: [2023-04-29 11:26:46,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +23: [2023-04-29 11:26:46,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +23: [2023-04-29 11:26:46,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +23: [2023-04-29 11:26:46,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +10: [2023-04-29 11:26:46,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +10: [2023-04-29 11:26:46,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 3: [2023-04-29 11:26:46,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +33: [2023-04-29 11:26:46,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +33: [2023-04-29 11:26:46,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +33: [2023-04-29 11:26:46,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +33: [2023-04-29 11:26:46,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +63: [2023-04-29 11:26:46,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +10: [2023-04-29 11:26:46,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 6: [2023-04-29 11:26:46,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 6: [2023-04-29 11:26:46,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 5: [2023-04-29 11:26:46,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 5: [2023-04-29 11:26:46,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 5: [2023-04-29 11:26:46,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 5: [2023-04-29 11:26:46,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +28: [2023-04-29 11:26:46,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +63: [2023-04-29 11:26:46,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +63: [2023-04-29 11:26:46,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +23: [2023-04-29 11:26:46,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +11: [2023-04-29 11:26:46,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +11: [2023-04-29 11:26:46,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +28: [2023-04-29 11:26:46,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +28: [2023-04-29 11:26:46,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +24: [2023-04-29 11:26:46,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +24: [2023-04-29 11:26:46,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +24: [2023-04-29 11:26:46,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +11: [2023-04-29 11:26:46,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 0: [2023-04-29 11:26:46,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +61: [2023-04-29 11:26:46,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +28: [2023-04-29 11:26:46,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +61: [2023-04-29 11:26:46,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +61: [2023-04-29 11:26:46,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +61: [2023-04-29 11:26:46,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +61: [2023-04-29 11:26:46,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +61: [2023-04-29 11:26:46,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +61: [2023-04-29 11:26:46,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +61: [2023-04-29 11:26:46,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +28: [2023-04-29 11:26:46,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... + 0: [2023-04-29 11:26:46,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +11: [2023-04-29 11:26:46,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +11: [2023-04-29 11:26:46,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +27: [2023-04-29 11:26:46,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +27: [2023-04-29 11:26:46,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +27: [2023-04-29 11:26:46,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +27: [2023-04-29 11:26:46,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 0: [2023-04-29 11:26:46,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +24: [2023-04-29 11:26:46,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +61: [2023-04-29 11:26:46,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +11: [2023-04-29 11:26:46,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +13: [2023-04-29 11:26:46,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +13: [2023-04-29 11:26:46,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +13: [2023-04-29 11:26:46,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +61: [2023-04-29 11:26:46,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +13: [2023-04-29 11:26:46,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +61: [2023-04-29 11:26:46,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +61: [2023-04-29 11:26:46,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +61: [2023-04-29 11:26:46,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +29: [2023-04-29 11:26:46,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +61: [2023-04-29 11:26:46,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +61: [2023-04-29 11:26:46,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +61: [2023-04-29 11:26:46,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +27: [2023-04-29 11:26:46,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +27: [2023-04-29 11:26:46,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +27: [2023-04-29 11:26:46,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +27: [2023-04-29 11:26:46,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +13: [2023-04-29 11:26:46,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +13: [2023-04-29 11:26:46,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +13: [2023-04-29 11:26:46,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +13: [2023-04-29 11:26:46,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 7: [2023-04-29 11:26:46,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +23: [2023-04-29 11:26:46,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +18: [2023-04-29 11:26:46,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +23: [2023-04-29 11:26:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +37: [2023-04-29 11:26:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +37: [2023-04-29 11:26:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +16: [2023-04-29 11:26:46,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 11:26:46,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +16: [2023-04-29 11:26:46,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +16: [2023-04-29 11:26:46,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +16: [2023-04-29 11:26:46,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 11:26:46,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 7: [2023-04-29 11:26:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 7: [2023-04-29 11:26:46,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 7: [2023-04-29 11:26:46,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +24: [2023-04-29 11:26:46,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +33: [2023-04-29 11:26:46,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +60: [2023-04-29 11:26:46,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +37: [2023-04-29 11:26:46,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +37: [2023-04-29 11:26:46,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +16: [2023-04-29 11:26:46,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +33: [2023-04-29 11:26:46,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +23: [2023-04-29 11:26:46,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +23: [2023-04-29 11:26:46,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +33: [2023-04-29 11:26:46,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +33: [2023-04-29 11:26:46,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +15: [2023-04-29 11:26:46,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +15: [2023-04-29 11:26:46,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +15: [2023-04-29 11:26:46,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +15: [2023-04-29 11:26:46,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +15: [2023-04-29 11:26:46,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +15: [2023-04-29 11:26:46,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +15: [2023-04-29 11:26:46,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +15: [2023-04-29 11:26:46,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +29: [2023-04-29 11:26:46,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +29: [2023-04-29 11:26:46,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +60: [2023-04-29 11:26:46,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... + 5: [2023-04-29 11:26:46,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +60: [2023-04-29 11:26:46,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +21: [2023-04-29 11:26:46,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +21: [2023-04-29 11:26:46,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +21: [2023-04-29 11:26:46,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +21: [2023-04-29 11:26:46,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +60: [2023-04-29 11:26:46,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +60: [2023-04-29 11:26:46,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +18: [2023-04-29 11:26:46,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 11:26:46,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +29: [2023-04-29 11:26:46,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +24: [2023-04-29 11:26:46,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +15: [2023-04-29 11:26:46,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +15: [2023-04-29 11:26:46,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +15: [2023-04-29 11:26:46,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +21: [2023-04-29 11:26:46,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +21: [2023-04-29 11:26:46,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +60: [2023-04-29 11:26:46,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +21: [2023-04-29 11:26:46,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +60: [2023-04-29 11:26:46,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +21: [2023-04-29 11:26:46,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +15: [2023-04-29 11:26:46,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +29: [2023-04-29 11:26:46,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +60: [2023-04-29 11:26:46,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +15: [2023-04-29 11:26:46,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +15: [2023-04-29 11:26:46,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +15: [2023-04-29 11:26:46,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +15: [2023-04-29 11:26:46,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 7: [2023-04-29 11:26:46,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +16: [2023-04-29 11:26:46,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +18: [2023-04-29 11:26:46,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +18: [2023-04-29 11:26:46,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +24: [2023-04-29 11:26:46,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +24: [2023-04-29 11:26:46,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +18: [2023-04-29 11:26:46,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +37: [2023-04-29 11:26:46,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 7: [2023-04-29 11:26:46,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +51: [2023-04-29 11:26:46,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +51: [2023-04-29 11:26:46,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +51: [2023-04-29 11:26:46,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +51: [2023-04-29 11:26:46,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +23: [2023-04-29 11:26:46,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +23: [2023-04-29 11:26:46,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +24: [2023-04-29 11:26:46,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 11:26:46,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +25: [2023-04-29 11:26:46,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +25: [2023-04-29 11:26:46,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +37: [2023-04-29 11:26:46,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 9: [2023-04-29 11:26:46,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 11:26:46,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +48: [2023-04-29 11:26:46,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +48: [2023-04-29 11:26:46,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +25: [2023-04-29 11:26:46,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +48: [2023-04-29 11:26:46,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +25: [2023-04-29 11:26:46,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +48: [2023-04-29 11:26:46,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +23: [2023-04-29 11:26:46,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +37: [2023-04-29 11:26:46,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +23: [2023-04-29 11:26:46,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +25: [2023-04-29 11:26:46,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 9: [2023-04-29 11:26:46,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +33: [2023-04-29 11:26:46,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +37: [2023-04-29 11:26:46,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +23: [2023-04-29 11:26:46,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +23: [2023-04-29 11:26:46,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +33: [2023-04-29 11:26:46,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +16: [2023-04-29 11:26:46,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +16: [2023-04-29 11:26:46,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +25: [2023-04-29 11:26:46,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +29: [2023-04-29 11:26:46,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 11:26:46,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +30: [2023-04-29 11:26:46,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +30: [2023-04-29 11:26:46,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 7: [2023-04-29 11:26:46,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +25: [2023-04-29 11:26:46,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +33: [2023-04-29 11:26:46,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 11:26:46,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +25: [2023-04-29 11:26:46,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +29: [2023-04-29 11:26:46,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +19: [2023-04-29 11:26:46,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +19: [2023-04-29 11:26:46,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +19: [2023-04-29 11:26:46,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +12: [2023-04-29 11:26:46,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +24: [2023-04-29 11:26:46,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +19: [2023-04-29 11:26:46,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +12: [2023-04-29 11:26:46,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +12: [2023-04-29 11:26:46,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +12: [2023-04-29 11:26:46,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +12: [2023-04-29 11:26:46,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +12: [2023-04-29 11:26:46,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +12: [2023-04-29 11:26:46,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +12: [2023-04-29 11:26:46,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +29: [2023-04-29 11:26:46,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +33: [2023-04-29 11:26:46,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +16: [2023-04-29 11:26:46,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +16: [2023-04-29 11:26:46,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +33: [2023-04-29 11:26:46,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +23: [2023-04-29 11:26:46,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +23: [2023-04-29 11:26:46,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +30: [2023-04-29 11:26:46,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 11:26:46,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 11:26:46,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +33: [2023-04-29 11:26:46,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +30: [2023-04-29 11:26:46,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +12: [2023-04-29 11:26:46,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +12: [2023-04-29 11:26:46,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +19: [2023-04-29 11:26:46,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +19: [2023-04-29 11:26:46,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +33: [2023-04-29 11:26:46,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +12: [2023-04-29 11:26:46,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +24: [2023-04-29 11:26:46,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +19: [2023-04-29 11:26:46,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +16: [2023-04-29 11:26:46,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +19: [2023-04-29 11:26:46,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +12: [2023-04-29 11:26:46,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +61: [2023-04-29 11:26:46,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +12: [2023-04-29 11:26:46,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +12: [2023-04-29 11:26:46,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +12: [2023-04-29 11:26:46,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +18: [2023-04-29 11:26:46,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +12: [2023-04-29 11:26:46,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +16: [2023-04-29 11:26:46,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +33: [2023-04-29 11:26:46,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +17: [2023-04-29 11:26:46,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +17: [2023-04-29 11:26:46,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +17: [2023-04-29 11:26:46,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +32: [2023-04-29 11:26:46,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 11:26:46,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 11:26:46,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +18: [2023-04-29 11:26:46,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +17: [2023-04-29 11:26:46,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +32: [2023-04-29 11:26:46,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 11:26:46,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 11:26:46,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 11:26:46,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 11:26:46,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +27: [2023-04-29 11:26:46,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 0: [2023-04-29 11:26:46,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +13: [2023-04-29 11:26:46,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +34: [2023-04-29 11:26:46,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +34: [2023-04-29 11:26:46,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +34: [2023-04-29 11:26:46,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +17: [2023-04-29 11:26:46,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +34: [2023-04-29 11:26:46,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +51: [2023-04-29 11:26:46,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +51: [2023-04-29 11:26:46,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +51: [2023-04-29 11:26:46,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +17: [2023-04-29 11:26:46,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +24: [2023-04-29 11:26:46,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +17: [2023-04-29 11:26:46,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +13: [2023-04-29 11:26:46,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +17: [2023-04-29 11:26:46,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +51: [2023-04-29 11:26:46,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +61: [2023-04-29 11:26:46,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +61: [2023-04-29 11:26:46,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +32: [2023-04-29 11:26:46,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +48: [2023-04-29 11:26:46,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +27: [2023-04-29 11:26:46,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +27: [2023-04-29 11:26:46,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +27: [2023-04-29 11:26:46,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +24: [2023-04-29 11:26:46,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +48: [2023-04-29 11:26:46,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +48: [2023-04-29 11:26:46,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +48: [2023-04-29 11:26:46,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +11: [2023-04-29 11:26:46,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +11: [2023-04-29 11:26:46,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +11: [2023-04-29 11:26:46,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 0: [2023-04-29 11:26:46,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. + 0: [2023-04-29 11:26:46,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +44: [2023-04-29 11:26:46,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +44: [2023-04-29 11:26:46,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +61: [2023-04-29 11:26:46,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +11: [2023-04-29 11:26:46,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +45: [2023-04-29 11:26:46,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +45: [2023-04-29 11:26:46,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +45: [2023-04-29 11:26:46,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +44: [2023-04-29 11:26:46,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +45: [2023-04-29 11:26:46,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +44: [2023-04-29 11:26:46,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +11: [2023-04-29 11:26:46,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +11: [2023-04-29 11:26:46,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +32: [2023-04-29 11:26:46,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +32: [2023-04-29 11:26:46,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +40: [2023-04-29 11:26:46,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +40: [2023-04-29 11:26:46,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +40: [2023-04-29 11:26:46,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +40: [2023-04-29 11:26:46,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 11:26:46,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +32: [2023-04-29 11:26:46,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +23: [2023-04-29 11:26:46,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +23: [2023-04-29 11:26:46,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +32: [2023-04-29 11:26:46,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +23: [2023-04-29 11:26:46,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +23: [2023-04-29 11:26:46,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +13: [2023-04-29 11:26:46,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +33: [2023-04-29 11:26:46,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 0: [2023-04-29 11:26:46,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +21: [2023-04-29 11:26:46,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +32: [2023-04-29 11:26:46,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +32: [2023-04-29 11:26:46,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +11: [2023-04-29 11:26:46,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 0: [2023-04-29 11:26:46,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 5: [2023-04-29 11:26:46,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +53: [2023-04-29 11:26:46,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +53: [2023-04-29 11:26:46,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +61: [2023-04-29 11:26:46,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +53: [2023-04-29 11:26:46,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +53: [2023-04-29 11:26:46,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +53: [2023-04-29 11:26:46,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +53: [2023-04-29 11:26:46,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +53: [2023-04-29 11:26:46,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +53: [2023-04-29 11:26:46,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +24: [2023-04-29 11:26:46,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +24: [2023-04-29 11:26:46,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +40: [2023-04-29 11:26:46,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +24: [2023-04-29 11:26:46,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +15: [2023-04-29 11:26:46,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +15: [2023-04-29 11:26:46,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +40: [2023-04-29 11:26:46,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +13: [2023-04-29 11:26:46,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +23: [2023-04-29 11:26:46,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +23: [2023-04-29 11:26:46,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +23: [2023-04-29 11:26:46,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +23: [2023-04-29 11:26:46,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +40: [2023-04-29 11:26:46,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +53: [2023-04-29 11:26:46,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +27: [2023-04-29 11:26:46,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +33: [2023-04-29 11:26:46,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +53: [2023-04-29 11:26:46,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +40: [2023-04-29 11:26:46,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +53: [2023-04-29 11:26:46,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... + 5: [2023-04-29 11:26:46,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +53: [2023-04-29 11:26:46,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +21: [2023-04-29 11:26:46,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +21: [2023-04-29 11:26:46,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +21: [2023-04-29 11:26:46,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +13: [2023-04-29 11:26:46,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +11: [2023-04-29 11:26:46,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +53: [2023-04-29 11:26:46,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +53: [2023-04-29 11:26:46,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +15: [2023-04-29 11:26:46,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +15: [2023-04-29 11:26:46,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +53: [2023-04-29 11:26:46,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +53: [2023-04-29 11:26:46,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +24: [2023-04-29 11:26:46,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +24: [2023-04-29 11:26:46,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +24: [2023-04-29 11:26:46,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 5: [2023-04-29 11:26:46,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +34: [2023-04-29 11:26:46,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +34: [2023-04-29 11:26:46,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +61: [2023-04-29 11:26:46,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +33: [2023-04-29 11:26:46,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +33: [2023-04-29 11:26:46,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +61: [2023-04-29 11:26:46,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 9: [2023-04-29 11:26:46,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +45: [2023-04-29 11:26:46,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +45: [2023-04-29 11:26:46,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +13: [2023-04-29 11:26:46,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +25: [2023-04-29 11:26:46,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 1: [2023-04-29 11:26:46,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +34: [2023-04-29 11:26:46,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 8: [2023-04-29 11:26:46,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 8: [2023-04-29 11:26:46,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +45: [2023-04-29 11:26:46,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 1: [2023-04-29 11:26:46,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +45: [2023-04-29 11:26:46,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +33: [2023-04-29 11:26:46,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +25: [2023-04-29 11:26:46,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +27: [2023-04-29 11:26:46,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +45: [2023-04-29 11:26:46,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +34: [2023-04-29 11:26:46,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +45: [2023-04-29 11:26:46,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +27: [2023-04-29 11:26:46,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +27: [2023-04-29 11:26:46,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +40: [2023-04-29 11:26:46,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +40: [2023-04-29 11:26:46,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +48: [2023-04-29 11:26:46,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +48: [2023-04-29 11:26:46,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +48: [2023-04-29 11:26:46,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +48: [2023-04-29 11:26:46,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +40: [2023-04-29 11:26:46,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +44: [2023-04-29 11:26:46,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +33: [2023-04-29 11:26:46,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +33: [2023-04-29 11:26:46,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +44: [2023-04-29 11:26:46,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +45: [2023-04-29 11:26:46,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +40: [2023-04-29 11:26:46,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. + 3: [2023-04-29 11:26:46,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +45: [2023-04-29 11:26:46,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +16: [2023-04-29 11:26:46,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +61: [2023-04-29 11:26:46,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +33: [2023-04-29 11:26:46,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +44: [2023-04-29 11:26:46,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +44: [2023-04-29 11:26:46,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +45: [2023-04-29 11:26:46,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +45: [2023-04-29 11:26:46,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +43: [2023-04-29 11:26:46,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +43: [2023-04-29 11:26:46,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +43: [2023-04-29 11:26:46,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +21: [2023-04-29 11:26:46,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +33: [2023-04-29 11:26:46,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +43: [2023-04-29 11:26:46,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +45: [2023-04-29 11:26:46,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +36: [2023-04-29 11:26:46,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +36: [2023-04-29 11:26:46,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +48: [2023-04-29 11:26:46,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +48: [2023-04-29 11:26:46,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +59: [2023-04-29 11:26:46,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +59: [2023-04-29 11:26:46,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +12: [2023-04-29 11:26:46,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +48: [2023-04-29 11:26:46,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +36: [2023-04-29 11:26:46,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +25: [2023-04-29 11:26:46,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +36: [2023-04-29 11:26:46,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +45: [2023-04-29 11:26:46,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +23: [2023-04-29 11:26:46,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +59: [2023-04-29 11:26:46,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. + 3: [2023-04-29 11:26:46,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +16: [2023-04-29 11:26:46,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +48: [2023-04-29 11:26:46,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +59: [2023-04-29 11:26:46,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +15: [2023-04-29 11:26:46,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +13: [2023-04-29 11:26:46,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 9: [2023-04-29 11:26:46,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +30: [2023-04-29 11:26:46,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +25: [2023-04-29 11:26:46,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +19: [2023-04-29 11:26:46,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 11:26:46,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +12: [2023-04-29 11:26:46,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +13: [2023-04-29 11:26:46,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +19: [2023-04-29 11:26:46,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 11:26:46,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +15: [2023-04-29 11:26:46,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +16: [2023-04-29 11:26:46,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +30: [2023-04-29 11:26:46,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +30: [2023-04-29 11:26:46,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +30: [2023-04-29 11:26:46,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +21: [2023-04-29 11:26:46,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +21: [2023-04-29 11:26:46,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +21: [2023-04-29 11:26:46,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +14: [2023-04-29 11:26:46,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +14: [2023-04-29 11:26:46,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +19: [2023-04-29 11:26:46,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +19: [2023-04-29 11:26:46,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 11:26:46,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +15: [2023-04-29 11:26:46,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +15: [2023-04-29 11:26:46,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +33: [2023-04-29 11:26:46,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +10: [2023-04-29 11:26:46,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +10: [2023-04-29 11:26:46,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +10: [2023-04-29 11:26:46,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +10: [2023-04-29 11:26:46,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +50: [2023-04-29 11:26:46,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 11:26:46,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 11:26:46,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +12: [2023-04-29 11:26:46,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +17: [2023-04-29 11:26:46,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +50: [2023-04-29 11:26:46,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +25: [2023-04-29 11:26:46,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +14: [2023-04-29 11:26:46,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +14: [2023-04-29 11:26:46,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 11:26:46,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +55: [2023-04-29 11:26:46,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +55: [2023-04-29 11:26:46,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +12: [2023-04-29 11:26:46,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +25: [2023-04-29 11:26:46,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +29: [2023-04-29 11:26:46,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +29: [2023-04-29 11:26:46,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +16: [2023-04-29 11:26:46,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +51: [2023-04-29 11:26:46,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +14: [2023-04-29 11:26:46,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +10: [2023-04-29 11:26:46,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +10: [2023-04-29 11:26:46,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +29: [2023-04-29 11:26:46,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +14: [2023-04-29 11:26:46,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +29: [2023-04-29 11:26:46,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +55: [2023-04-29 11:26:46,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +55: [2023-04-29 11:26:46,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +14: [2023-04-29 11:26:46,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +28: [2023-04-29 11:26:46,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +28: [2023-04-29 11:26:46,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +33: [2023-04-29 11:26:46,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +28: [2023-04-29 11:26:46,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +28: [2023-04-29 11:26:46,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +10: [2023-04-29 11:26:46,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +51: [2023-04-29 11:26:46,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +16: [2023-04-29 11:26:46,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +17: [2023-04-29 11:26:46,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +10: [2023-04-29 11:26:46,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +50: [2023-04-29 11:26:46,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +17: [2023-04-29 11:26:46,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 11:26:46,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +26: [2023-04-29 11:26:46,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +26: [2023-04-29 11:26:46,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +26: [2023-04-29 11:26:46,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +14: [2023-04-29 11:26:46,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +17: [2023-04-29 11:26:46,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +26: [2023-04-29 11:26:46,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 0: [2023-04-29 11:26:46,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 0: [2023-04-29 11:26:46,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +50: [2023-04-29 11:26:46,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +40: [2023-04-29 11:26:46,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +50: [2023-04-29 11:26:46,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +48: [2023-04-29 11:26:46,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +51: [2023-04-29 11:26:46,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +50: [2023-04-29 11:26:46,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +28: [2023-04-29 11:26:46,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +28: [2023-04-29 11:26:46,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +28: [2023-04-29 11:26:46,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +33: [2023-04-29 11:26:46,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +51: [2023-04-29 11:26:46,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +51: [2023-04-29 11:26:46,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +39: [2023-04-29 11:26:46,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. + 2: [2023-04-29 11:26:46,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +39: [2023-04-29 11:26:46,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +39: [2023-04-29 11:26:46,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. + 2: [2023-04-29 11:26:46,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 2: [2023-04-29 11:26:46,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 2: [2023-04-29 11:26:46,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 0: [2023-04-29 11:26:46,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +39: [2023-04-29 11:26:46,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. + 2: [2023-04-29 11:26:46,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +40: [2023-04-29 11:26:46,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +25: [2023-04-29 11:26:46,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +59: [2023-04-29 11:26:46,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +59: [2023-04-29 11:26:46,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +43: [2023-04-29 11:26:46,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +12: [2023-04-29 11:26:46,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +40: [2023-04-29 11:26:46,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +40: [2023-04-29 11:26:46,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +43: [2023-04-29 11:26:46,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +51: [2023-04-29 11:26:46,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +28: [2023-04-29 11:26:46,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +36: [2023-04-29 11:26:46,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +36: [2023-04-29 11:26:46,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +36: [2023-04-29 11:26:46,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +59: [2023-04-29 11:26:46,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +43: [2023-04-29 11:26:46,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +43: [2023-04-29 11:26:46,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +58: [2023-04-29 11:26:46,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +58: [2023-04-29 11:26:46,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +58: [2023-04-29 11:26:46,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +23: [2023-04-29 11:26:46,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +16: [2023-04-29 11:26:46,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +48: [2023-04-29 11:26:46,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +19: [2023-04-29 11:26:46,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +48: [2023-04-29 11:26:46,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +58: [2023-04-29 11:26:46,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +59: [2023-04-29 11:26:46,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +36: [2023-04-29 11:26:46,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +25: [2023-04-29 11:26:46,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 11:26:46,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +33: [2023-04-29 11:26:46,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +23: [2023-04-29 11:26:46,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +51: [2023-04-29 11:26:46,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +19: [2023-04-29 11:26:46,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +58: [2023-04-29 11:26:46,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +58: [2023-04-29 11:26:46,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +58: [2023-04-29 11:26:46,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +53: [2023-04-29 11:26:46,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +58: [2023-04-29 11:26:46,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +51: [2023-04-29 11:26:46,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +23: [2023-04-29 11:26:46,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +48: [2023-04-29 11:26:46,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +12: [2023-04-29 11:26:46,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +30: [2023-04-29 11:26:46,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +48: [2023-04-29 11:26:46,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +20: [2023-04-29 11:26:46,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +20: [2023-04-29 11:26:46,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +17: [2023-04-29 11:26:46,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 11:26:46,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +22: [2023-04-29 11:26:46,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +22: [2023-04-29 11:26:46,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +30: [2023-04-29 11:26:46,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +48: [2023-04-29 11:26:46,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +33: [2023-04-29 11:26:46,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +19: [2023-04-29 11:26:46,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +22: [2023-04-29 11:26:46,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +19: [2023-04-29 11:26:46,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +22: [2023-04-29 11:26:46,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +11: [2023-04-29 11:26:46,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +40: [2023-04-29 11:26:46,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +20: [2023-04-29 11:26:46,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +26: [2023-04-29 11:26:46,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +26: [2023-04-29 11:26:46,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +20: [2023-04-29 11:26:46,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +26: [2023-04-29 11:26:46,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +20: [2023-04-29 11:26:46,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +20: [2023-04-29 11:26:46,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 4: [2023-04-29 11:26:46,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +20: [2023-04-29 11:26:46,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. +22: [2023-04-29 11:26:46,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 11:26:46,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_10-model_01-model_states.pt. + 6: [2023-04-29 11:26:46,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +48: [2023-04-29 11:26:46,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... + 6: [2023-04-29 11:26:46,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +55: [2023-04-29 11:26:46,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +20: [2023-04-29 11:26:46,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +23: [2023-04-29 11:26:46,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +22: [2023-04-29 11:26:46,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +29: [2023-04-29 11:26:46,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 11:26:46,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 11:26:46,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +12: [2023-04-29 11:26:46,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +12: [2023-04-29 11:26:46,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +48: [2023-04-29 11:26:46,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +26: [2023-04-29 11:26:46,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +11: [2023-04-29 11:26:46,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +11: [2023-04-29 11:26:46,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +53: [2023-04-29 11:26:46,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +22: [2023-04-29 11:26:46,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +55: [2023-04-29 11:26:46,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +55: [2023-04-29 11:26:46,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +20: [2023-04-29 11:26:46,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +26: [2023-04-29 11:26:46,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +26: [2023-04-29 11:26:46,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +17: [2023-04-29 11:26:46,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +26: [2023-04-29 11:26:46,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +26: [2023-04-29 11:26:46,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +29: [2023-04-29 11:26:46,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +22: [2023-04-29 11:26:46,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +29: [2023-04-29 11:26:46,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +29: [2023-04-29 11:26:46,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +32: [2023-04-29 11:26:46,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 11:26:46,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 11:26:46,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +32: [2023-04-29 11:26:46,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +17: [2023-04-29 11:26:46,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 11:26:46,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +30: [2023-04-29 11:26:46,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +30: [2023-04-29 11:26:46,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +30: [2023-04-29 11:26:46,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +17: [2023-04-29 11:26:46,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +26: [2023-04-29 11:26:46,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +55: [2023-04-29 11:26:46,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +39: [2023-04-29 11:26:46,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +53: [2023-04-29 11:26:46,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +45: [2023-04-29 11:26:46,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +26: [2023-04-29 11:26:46,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +26: [2023-04-29 11:26:46,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +39: [2023-04-29 11:26:46,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +39: [2023-04-29 11:26:46,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +39: [2023-04-29 11:26:46,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +53: [2023-04-29 11:26:46,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +40: [2023-04-29 11:26:46,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +40: [2023-04-29 11:26:46,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +45: [2023-04-29 11:26:46,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +53: [2023-04-29 11:26:46,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +33: [2023-04-29 11:26:46,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +33: [2023-04-29 11:26:46,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +40: [2023-04-29 11:26:46,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +26: [2023-04-29 11:26:46,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +11: [2023-04-29 11:26:46,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +59: [2023-04-29 11:26:46,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +59: [2023-04-29 11:26:46,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +59: [2023-04-29 11:26:46,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +59: [2023-04-29 11:26:46,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +11: [2023-04-29 11:26:46,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +40: [2023-04-29 11:26:46,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +45: [2023-04-29 11:26:46,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +13: [2023-04-29 11:26:46,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +13: [2023-04-29 11:26:46,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +13: [2023-04-29 11:26:46,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +13: [2023-04-29 11:26:46,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +20: [2023-04-29 11:26:46,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +20: [2023-04-29 11:26:46,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +34: [2023-04-29 11:26:46,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +34: [2023-04-29 11:26:46,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +34: [2023-04-29 11:26:46,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +34: [2023-04-29 11:26:46,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +34: [2023-04-29 11:26:46,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +34: [2023-04-29 11:26:46,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +34: [2023-04-29 11:26:46,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +34: [2023-04-29 11:26:46,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +48: [2023-04-29 11:26:46,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +59: [2023-04-29 11:26:46,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +58: [2023-04-29 11:26:46,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +58: [2023-04-29 11:26:46,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +58: [2023-04-29 11:26:46,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +45: [2023-04-29 11:26:46,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +58: [2023-04-29 11:26:46,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +45: [2023-04-29 11:26:46,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +45: [2023-04-29 11:26:46,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +48: [2023-04-29 11:26:46,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +45: [2023-04-29 11:26:46,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... + 3: [2023-04-29 11:26:46,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +45: [2023-04-29 11:26:46,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +45: [2023-04-29 11:26:46,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +63: [2023-04-29 11:26:46,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +63: [2023-04-29 11:26:46,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +63: [2023-04-29 11:26:46,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +59: [2023-04-29 11:26:46,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +59: [2023-04-29 11:26:46,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +63: [2023-04-29 11:26:46,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. + 3: [2023-04-29 11:26:46,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +31: [2023-04-29 11:26:46,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +31: [2023-04-29 11:26:46,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +31: [2023-04-29 11:26:46,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +53: [2023-04-29 11:26:46,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +20: [2023-04-29 11:26:46,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +31: [2023-04-29 11:26:46,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +48: [2023-04-29 11:26:46,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +59: [2023-04-29 11:26:46,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +34: [2023-04-29 11:26:46,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +34: [2023-04-29 11:26:46,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +48: [2023-04-29 11:26:46,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 11:26:46,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +50: [2023-04-29 11:26:46,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +50: [2023-04-29 11:26:46,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +50: [2023-04-29 11:26:46,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +45: [2023-04-29 11:26:46,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +34: [2023-04-29 11:26:46,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +10: [2023-04-29 11:26:46,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +20: [2023-04-29 11:26:46,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt... +11: [2023-04-29 11:26:46,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +11: [2023-04-29 11:26:46,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +30: [2023-04-29 11:26:46,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +31: [2023-04-29 11:26:46,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +31: [2023-04-29 11:26:46,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +31: [2023-04-29 11:26:46,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +34: [2023-04-29 11:26:46,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +30: [2023-04-29 11:26:46,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +45: [2023-04-29 11:26:46,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +30: [2023-04-29 11:26:46,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +34: [2023-04-29 11:26:46,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +31: [2023-04-29 11:26:46,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +34: [2023-04-29 11:26:46,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +36: [2023-04-29 11:26:46,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +30: [2023-04-29 11:26:46,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +34: [2023-04-29 11:26:46,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +34: [2023-04-29 11:26:46,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +28: [2023-04-29 11:26:46,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +45: [2023-04-29 11:26:46,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +45: [2023-04-29 11:26:46,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +14: [2023-04-29 11:26:46,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +10: [2023-04-29 11:26:46,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +53: [2023-04-29 11:26:46,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +46: [2023-04-29 11:26:46,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +46: [2023-04-29 11:26:46,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. + 1: [2023-04-29 11:26:46,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +32: [2023-04-29 11:26:46,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +10: [2023-04-29 11:26:46,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +53: [2023-04-29 11:26:46,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +32: [2023-04-29 11:26:46,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +39: [2023-04-29 11:26:46,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +40: [2023-04-29 11:26:46,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +45: [2023-04-29 11:26:46,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +36: [2023-04-29 11:26:46,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +46: [2023-04-29 11:26:46,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +28: [2023-04-29 11:26:46,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +46: [2023-04-29 11:26:46,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +39: [2023-04-29 11:26:46,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +32: [2023-04-29 11:26:46,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +14: [2023-04-29 11:26:46,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +35: [2023-04-29 11:26:46,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +35: [2023-04-29 11:26:46,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +35: [2023-04-29 11:26:46,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +35: [2023-04-29 11:26:46,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +32: [2023-04-29 11:26:46,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +40: [2023-04-29 11:26:46,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 1: [2023-04-29 11:26:46,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 1: [2023-04-29 11:26:46,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +11: [2023-04-29 11:26:46,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +59: [2023-04-29 11:26:46,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +59: [2023-04-29 11:26:46,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +14: [2023-04-29 11:26:46,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +28: [2023-04-29 11:26:46,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +57: [2023-04-29 11:26:46,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +37: [2023-04-29 11:26:46,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +37: [2023-04-29 11:26:46,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +57: [2023-04-29 11:26:46,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +57: [2023-04-29 11:26:46,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +37: [2023-04-29 11:26:46,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +57: [2023-04-29 11:26:46,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +59: [2023-04-29 11:26:46,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +39: [2023-04-29 11:26:46,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +37: [2023-04-29 11:26:46,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +36: [2023-04-29 11:26:46,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +36: [2023-04-29 11:26:46,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +52: [2023-04-29 11:26:46,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +52: [2023-04-29 11:26:46,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. + 0: [2023-04-29 11:26:46,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +14: [2023-04-29 11:26:46,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +37: [2023-04-29 11:26:46,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +37: [2023-04-29 11:26:46,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +37: [2023-04-29 11:26:46,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +40: [2023-04-29 11:26:46,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +37: [2023-04-29 11:26:46,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +43: [2023-04-29 11:26:46,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +43: [2023-04-29 11:26:46,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +38: [2023-04-29 11:26:46,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +38: [2023-04-29 11:26:46,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. + 1: [2023-04-29 11:26:46,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +38: [2023-04-29 11:26:46,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +10: [2023-04-29 11:26:46,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +38: [2023-04-29 11:26:46,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +42: [2023-04-29 11:26:46,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +42: [2023-04-29 11:26:46,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +50: [2023-04-29 11:26:46,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 11:26:46,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 11:26:46,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +40: [2023-04-29 11:26:46,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +13: [2023-04-29 11:26:46,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +47: [2023-04-29 11:26:46,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +47: [2023-04-29 11:26:46,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +43: [2023-04-29 11:26:46,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +43: [2023-04-29 11:26:46,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +59: [2023-04-29 11:26:46,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +59: [2023-04-29 11:26:46,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +39: [2023-04-29 11:26:46,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +59: [2023-04-29 11:26:46,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +46: [2023-04-29 11:26:46,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +46: [2023-04-29 11:26:46,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +39: [2023-04-29 11:26:46,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +36: [2023-04-29 11:26:46,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +36: [2023-04-29 11:26:46,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 11:26:46,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +39: [2023-04-29 11:26:46,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +37: [2023-04-29 11:26:46,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +48: [2023-04-29 11:26:46,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +36: [2023-04-29 11:26:46,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +43: [2023-04-29 11:26:46,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +43: [2023-04-29 11:26:46,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +14: [2023-04-29 11:26:46,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +37: [2023-04-29 11:26:46,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +31: [2023-04-29 11:26:46,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +31: [2023-04-29 11:26:46,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +31: [2023-04-29 11:26:46,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +31: [2023-04-29 11:26:46,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +14: [2023-04-29 11:26:46,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +13: [2023-04-29 11:26:46,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +58: [2023-04-29 11:26:46,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +52: [2023-04-29 11:26:46,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. + 5: [2023-04-29 11:26:46,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +52: [2023-04-29 11:26:46,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +46: [2023-04-29 11:26:46,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +58: [2023-04-29 11:26:46,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +58: [2023-04-29 11:26:46,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +44: [2023-04-29 11:26:46,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +44: [2023-04-29 11:26:46,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +44: [2023-04-29 11:26:46,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +44: [2023-04-29 11:26:46,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +46: [2023-04-29 11:26:46,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +44: [2023-04-29 11:26:46,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +44: [2023-04-29 11:26:46,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +44: [2023-04-29 11:26:46,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +47: [2023-04-29 11:26:46,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +40: [2023-04-29 11:26:46,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +44: [2023-04-29 11:26:46,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 0: [2023-04-29 11:26:46,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 0: [2023-04-29 11:26:46,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +45: [2023-04-29 11:26:46,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +13: [2023-04-29 11:26:46,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +47: [2023-04-29 11:26:46,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +37: [2023-04-29 11:26:46,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... + 4: [2023-04-29 11:26:46,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 4: [2023-04-29 11:26:46,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 4: [2023-04-29 11:26:46,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 4: [2023-04-29 11:26:46,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 0: [2023-04-29 11:26:46,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +41: [2023-04-29 11:26:46,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +41: [2023-04-29 11:26:46,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +58: [2023-04-29 11:26:46,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +48: [2023-04-29 11:26:46,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +47: [2023-04-29 11:26:46,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +47: [2023-04-29 11:26:46,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +43: [2023-04-29 11:26:46,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +43: [2023-04-29 11:26:46,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +41: [2023-04-29 11:26:46,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +13: [2023-04-29 11:26:46,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +42: [2023-04-29 11:26:46,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +42: [2023-04-29 11:26:46,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +42: [2023-04-29 11:26:46,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +42: [2023-04-29 11:26:46,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +58: [2023-04-29 11:26:46,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +41: [2023-04-29 11:26:46,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +36: [2023-04-29 11:26:46,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +48: [2023-04-29 11:26:46,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +39: [2023-04-29 11:26:46,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +47: [2023-04-29 11:26:46,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +39: [2023-04-29 11:26:46,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +47: [2023-04-29 11:26:46,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +14: [2023-04-29 11:26:46,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +42: [2023-04-29 11:26:46,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +37: [2023-04-29 11:26:46,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +37: [2023-04-29 11:26:46,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +37: [2023-04-29 11:26:46,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +37: [2023-04-29 11:26:46,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +46: [2023-04-29 11:26:46,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +46: [2023-04-29 11:26:46,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +14: [2023-04-29 11:26:46,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +46: [2023-04-29 11:26:46,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +37: [2023-04-29 11:26:46,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +63: [2023-04-29 11:26:46,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +48: [2023-04-29 11:26:46,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +40: [2023-04-29 11:26:46,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +55: [2023-04-29 11:26:46,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +40: [2023-04-29 11:26:46,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 11:26:46,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +50: [2023-04-29 11:26:46,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +46: [2023-04-29 11:26:46,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +44: [2023-04-29 11:26:46,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +44: [2023-04-29 11:26:46,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +44: [2023-04-29 11:26:46,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +50: [2023-04-29 11:26:46,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +26: [2023-04-29 11:26:46,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +50: [2023-04-29 11:26:46,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +42: [2023-04-29 11:26:46,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +10: [2023-04-29 11:26:46,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +44: [2023-04-29 11:26:46,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... + 8: [2023-04-29 11:26:46,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +44: [2023-04-29 11:26:46,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +63: [2023-04-29 11:26:46,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +44: [2023-04-29 11:26:46,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +14: [2023-04-29 11:26:46,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +44: [2023-04-29 11:26:46,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +63: [2023-04-29 11:26:46,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +63: [2023-04-29 11:26:46,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +20: [2023-04-29 11:26:46,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +47: [2023-04-29 11:26:46,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +44: [2023-04-29 11:26:46,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... + 8: [2023-04-29 11:26:46,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +22: [2023-04-29 11:26:46,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +10: [2023-04-29 11:26:46,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 7: [2023-04-29 11:26:46,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +26: [2023-04-29 11:26:46,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +42: [2023-04-29 11:26:46,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +40: [2023-04-29 11:26:46,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... + 7: [2023-04-29 11:26:46,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +28: [2023-04-29 11:26:46,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +45: [2023-04-29 11:26:46,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +40: [2023-04-29 11:26:46,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +47: [2023-04-29 11:26:46,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +42: [2023-04-29 11:26:46,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +28: [2023-04-29 11:26:46,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +55: [2023-04-29 11:26:46,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +47: [2023-04-29 11:26:46,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +17: [2023-04-29 11:26:46,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +17: [2023-04-29 11:26:46,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +42: [2023-04-29 11:26:46,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +17: [2023-04-29 11:26:46,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +17: [2023-04-29 11:26:46,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +42: [2023-04-29 11:26:46,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +40: [2023-04-29 11:26:46,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +28: [2023-04-29 11:26:46,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +29: [2023-04-29 11:26:46,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +47: [2023-04-29 11:26:46,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 3: [2023-04-29 11:26:46,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +22: [2023-04-29 11:26:46,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +22: [2023-04-29 11:26:46,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +22: [2023-04-29 11:26:46,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +10: [2023-04-29 11:26:46,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +56: [2023-04-29 11:26:46,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +56: [2023-04-29 11:26:46,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +38: [2023-04-29 11:26:46,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 8: [2023-04-29 11:26:46,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 5: [2023-04-29 11:26:46,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +46: [2023-04-29 11:26:46,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +38: [2023-04-29 11:26:46,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +38: [2023-04-29 11:26:46,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +56: [2023-04-29 11:26:46,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +46: [2023-04-29 11:26:46,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +56: [2023-04-29 11:26:46,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_32-model_01-model_states.pt. +58: [2023-04-29 11:26:46,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +58: [2023-04-29 11:26:46,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 0: [2023-04-29 11:26:46,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +59: [2023-04-29 11:26:46,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +38: [2023-04-29 11:26:46,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +26: [2023-04-29 11:26:46,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +26: [2023-04-29 11:26:46,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +22: [2023-04-29 11:26:46,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +28: [2023-04-29 11:26:46,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +57: [2023-04-29 11:26:46,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +22: [2023-04-29 11:26:46,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +40: [2023-04-29 11:26:46,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +41: [2023-04-29 11:26:46,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +41: [2023-04-29 11:26:46,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +22: [2023-04-29 11:26:46,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +46: [2023-04-29 11:26:46,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +35: [2023-04-29 11:26:46,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +56: [2023-04-29 11:26:46,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +56: [2023-04-29 11:26:46,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +46: [2023-04-29 11:26:46,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +29: [2023-04-29 11:26:46,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 3: [2023-04-29 11:26:46,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +26: [2023-04-29 11:26:46,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +29: [2023-04-29 11:26:46,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +20: [2023-04-29 11:26:46,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +57: [2023-04-29 11:26:46,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +39: [2023-04-29 11:26:46,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +57: [2023-04-29 11:26:46,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +57: [2023-04-29 11:26:46,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +57: [2023-04-29 11:26:46,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +57: [2023-04-29 11:26:46,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +38: [2023-04-29 11:26:46,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +22: [2023-04-29 11:26:46,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +57: [2023-04-29 11:26:46,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +57: [2023-04-29 11:26:46,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +35: [2023-04-29 11:26:46,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +55: [2023-04-29 11:26:46,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +62: [2023-04-29 11:26:46,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +62: [2023-04-29 11:26:46,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +62: [2023-04-29 11:26:46,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +38: [2023-04-29 11:26:46,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +58: [2023-04-29 11:26:46,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 11:26:46,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +62: [2023-04-29 11:26:46,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +35: [2023-04-29 11:26:46,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +41: [2023-04-29 11:26:46,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +14: [2023-04-29 11:26:46,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +52: [2023-04-29 11:26:46,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +52: [2023-04-29 11:26:46,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +55: [2023-04-29 11:26:46,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +55: [2023-04-29 11:26:46,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +38: [2023-04-29 11:26:46,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +55: [2023-04-29 11:26:46,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +47: [2023-04-29 11:26:46,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +38: [2023-04-29 11:26:46,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +55: [2023-04-29 11:26:46,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +55: [2023-04-29 11:26:46,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +47: [2023-04-29 11:26:46,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +56: [2023-04-29 11:26:46,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +47: [2023-04-29 11:26:46,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +38: [2023-04-29 11:26:46,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +38: [2023-04-29 11:26:46,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +41: [2023-04-29 11:26:46,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +38: [2023-04-29 11:26:46,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +41: [2023-04-29 11:26:46,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +29: [2023-04-29 11:26:46,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +29: [2023-04-29 11:26:46,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +39: [2023-04-29 11:26:46,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +31: [2023-04-29 11:26:46,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +39: [2023-04-29 11:26:46,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +55: [2023-04-29 11:26:46,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +59: [2023-04-29 11:26:46,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +29: [2023-04-29 11:26:46,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +56: [2023-04-29 11:26:46,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +56: [2023-04-29 11:26:46,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +14: [2023-04-29 11:26:46,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +38: [2023-04-29 11:26:46,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +52: [2023-04-29 11:26:46,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +42: [2023-04-29 11:26:46,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +42: [2023-04-29 11:26:46,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +21: [2023-04-29 11:26:46,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +21: [2023-04-29 11:26:46,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +43: [2023-04-29 11:26:46,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +43: [2023-04-29 11:26:46,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +56: [2023-04-29 11:26:46,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +41: [2023-04-29 11:26:46,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +52: [2023-04-29 11:26:46,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +57: [2023-04-29 11:26:46,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +57: [2023-04-29 11:26:46,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +57: [2023-04-29 11:26:46,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +11: [2023-04-29 11:26:46,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +11: [2023-04-29 11:26:46,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +57: [2023-04-29 11:26:46,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +41: [2023-04-29 11:26:46,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +55: [2023-04-29 11:26:46,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +41: [2023-04-29 11:26:46,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +41: [2023-04-29 11:26:46,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +50: [2023-04-29 11:26:46,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +11: [2023-04-29 11:26:46,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 4: [2023-04-29 11:26:46,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +50: [2023-04-29 11:26:46,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +31: [2023-04-29 11:26:46,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +55: [2023-04-29 11:26:46,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +11: [2023-04-29 11:26:46,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 0: [2023-04-29 11:26:46,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +47: [2023-04-29 11:26:46,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +10: [2023-04-29 11:26:46,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +50: [2023-04-29 11:26:46,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +31: [2023-04-29 11:26:46,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 11:26:46,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +20: [2023-04-29 11:26:46,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +43: [2023-04-29 11:26:46,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +43: [2023-04-29 11:26:46,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +31: [2023-04-29 11:26:46,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +58: [2023-04-29 11:26:46,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +54: [2023-04-29 11:26:46,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +54: [2023-04-29 11:26:46,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +54: [2023-04-29 11:26:46,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +51: [2023-04-29 11:26:46,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +51: [2023-04-29 11:26:46,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +41: [2023-04-29 11:26:46,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +14: [2023-04-29 11:26:46,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +41: [2023-04-29 11:26:46,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +54: [2023-04-29 11:26:46,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +39: [2023-04-29 11:26:46,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +21: [2023-04-29 11:26:46,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +26: [2023-04-29 11:26:46,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +56: [2023-04-29 11:26:46,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +26: [2023-04-29 11:26:46,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +21: [2023-04-29 11:26:46,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +14: [2023-04-29 11:26:46,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +29: [2023-04-29 11:26:46,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +43: [2023-04-29 11:26:46,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +55: [2023-04-29 11:26:46,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +22: [2023-04-29 11:26:46,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +51: [2023-04-29 11:26:46,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +55: [2023-04-29 11:26:46,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +43: [2023-04-29 11:26:46,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +51: [2023-04-29 11:26:46,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +14: [2023-04-29 11:26:46,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +29: [2023-04-29 11:26:46,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +20: [2023-04-29 11:26:46,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +26: [2023-04-29 11:26:46,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +41: [2023-04-29 11:26:46,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +42: [2023-04-29 11:26:46,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +39: [2023-04-29 11:26:46,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +42: [2023-04-29 11:26:46,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +56: [2023-04-29 11:26:46,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +54: [2023-04-29 11:26:46,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +43: [2023-04-29 11:26:46,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +43: [2023-04-29 11:26:46,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +50: [2023-04-29 11:26:46,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +54: [2023-04-29 11:26:46,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +30: [2023-04-29 11:26:46,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +55: [2023-04-29 11:26:46,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +55: [2023-04-29 11:26:46,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +20: [2023-04-29 11:26:46,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +54: [2023-04-29 11:26:46,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +54: [2023-04-29 11:26:46,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +55: [2023-04-29 11:26:46,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +20: [2023-04-29 11:26:46,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +14: [2023-04-29 11:26:46,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +51: [2023-04-29 11:26:46,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +39: [2023-04-29 11:26:46,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +51: [2023-04-29 11:26:46,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +14: [2023-04-29 11:26:46,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +34: [2023-04-29 11:26:46,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +28: [2023-04-29 11:26:46,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +59: [2023-04-29 11:26:46,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +62: [2023-04-29 11:26:46,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +62: [2023-04-29 11:26:46,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +51: [2023-04-29 11:26:46,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +51: [2023-04-29 11:26:46,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +26: [2023-04-29 11:26:46,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +62: [2023-04-29 11:26:46,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +17: [2023-04-29 11:26:46,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +17: [2023-04-29 11:26:46,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +62: [2023-04-29 11:26:46,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +30: [2023-04-29 11:26:46,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +26: [2023-04-29 11:26:46,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +24: [2023-04-29 11:26:46,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 11:26:46,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 11:26:46,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +22: [2023-04-29 11:26:46,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 11:26:46,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +24: [2023-04-29 11:26:46,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 11:26:46,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +27: [2023-04-29 11:26:46,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +27: [2023-04-29 11:26:46,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +17: [2023-04-29 11:26:46,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +27: [2023-04-29 11:26:46,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 2: [2023-04-29 11:26:46,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +27: [2023-04-29 11:26:46,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +62: [2023-04-29 11:26:46,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +17: [2023-04-29 11:26:46,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +26: [2023-04-29 11:26:46,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +62: [2023-04-29 11:26:46,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +62: [2023-04-29 11:26:46,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +22: [2023-04-29 11:26:46,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +26: [2023-04-29 11:26:46,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +62: [2023-04-29 11:26:46,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +39: [2023-04-29 11:26:46,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +24: [2023-04-29 11:26:46,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +56: [2023-04-29 11:26:46,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +24: [2023-04-29 11:26:46,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 11:26:46,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +30: [2023-04-29 11:26:46,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +58: [2023-04-29 11:26:46,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +24: [2023-04-29 11:26:46,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +24: [2023-04-29 11:26:46,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +58: [2023-04-29 11:26:46,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +26: [2023-04-29 11:26:46,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +20: [2023-04-29 11:26:46,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +26: [2023-04-29 11:26:46,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +56: [2023-04-29 11:26:46,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +62: [2023-04-29 11:26:46,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +30: [2023-04-29 11:26:46,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +62: [2023-04-29 11:26:46,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +31: [2023-04-29 11:26:46,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +31: [2023-04-29 11:26:46,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +31: [2023-04-29 11:26:46,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +62: [2023-04-29 11:26:46,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +62: [2023-04-29 11:26:46,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +22: [2023-04-29 11:26:46,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +26: [2023-04-29 11:26:46,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 2: [2023-04-29 11:26:46,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +34: [2023-04-29 11:26:46,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +30: [2023-04-29 11:26:46,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +39: [2023-04-29 11:26:46,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +39: [2023-04-29 11:26:46,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +58: [2023-04-29 11:26:46,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +30: [2023-04-29 11:26:46,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +56: [2023-04-29 11:26:46,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +34: [2023-04-29 11:26:46,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +59: [2023-04-29 11:26:46,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +22: [2023-04-29 11:26:46,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +21: [2023-04-29 11:26:46,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +30: [2023-04-29 11:26:46,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 2: [2023-04-29 11:26:46,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +59: [2023-04-29 11:26:46,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +11: [2023-04-29 11:26:46,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +37: [2023-04-29 11:26:46,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +11: [2023-04-29 11:26:46,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +44: [2023-04-29 11:26:46,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +56: [2023-04-29 11:26:46,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt... +59: [2023-04-29 11:26:46,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +34: [2023-04-29 11:26:46,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +22: [2023-04-29 11:26:46,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +26: [2023-04-29 11:26:46,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +22: [2023-04-29 11:26:46,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +22: [2023-04-29 11:26:46,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +21: [2023-04-29 11:26:46,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +21: [2023-04-29 11:26:46,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 11:26:46,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +20: [2023-04-29 11:26:46,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_00-model_states.pt. +20: [2023-04-29 11:26:46,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +37: [2023-04-29 11:26:46,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +21: [2023-04-29 11:26:46,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +11: [2023-04-29 11:26:46,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 11:26:46,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +34: [2023-04-29 11:26:46,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +13: [2023-04-29 11:26:46,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +11: [2023-04-29 11:26:46,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +52: [2023-04-29 11:26:46,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +52: [2023-04-29 11:26:46,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +59: [2023-04-29 11:26:46,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +19: [2023-04-29 11:26:46,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +19: [2023-04-29 11:26:46,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +19: [2023-04-29 11:26:46,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +19: [2023-04-29 11:26:46,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +60: [2023-04-29 11:26:46,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +60: [2023-04-29 11:26:46,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +60: [2023-04-29 11:26:46,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +60: [2023-04-29 11:26:46,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +13: [2023-04-29 11:26:46,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +31: [2023-04-29 11:26:46,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +39: [2023-04-29 11:26:46,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +58: [2023-04-29 11:26:46,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +44: [2023-04-29 11:26:46,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +52: [2023-04-29 11:26:46,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +52: [2023-04-29 11:26:46,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +20: [2023-04-29 11:26:46,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +50: [2023-04-29 11:26:46,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +63: [2023-04-29 11:26:46,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +46: [2023-04-29 11:26:46,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +20: [2023-04-29 11:26:46,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt... +52: [2023-04-29 11:26:46,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +52: [2023-04-29 11:26:46,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +27: [2023-04-29 11:26:46,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +50: [2023-04-29 11:26:46,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +13: [2023-04-29 11:26:46,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +13: [2023-04-29 11:26:46,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +28: [2023-04-29 11:26:46,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +28: [2023-04-29 11:26:46,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +37: [2023-04-29 11:26:46,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +37: [2023-04-29 11:26:46,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +44: [2023-04-29 11:26:46,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +36: [2023-04-29 11:26:46,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +36: [2023-04-29 11:26:46,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +60: [2023-04-29 11:26:46,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +58: [2023-04-29 11:26:46,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +39: [2023-04-29 11:26:46,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +39: [2023-04-29 11:26:46,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +60: [2023-04-29 11:26:46,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +36: [2023-04-29 11:26:46,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +27: [2023-04-29 11:26:46,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +27: [2023-04-29 11:26:46,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +39: [2023-04-29 11:26:46,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +27: [2023-04-29 11:26:46,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +36: [2023-04-29 11:26:46,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +52: [2023-04-29 11:26:46,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +60: [2023-04-29 11:26:46,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +63: [2023-04-29 11:26:46,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +52: [2023-04-29 11:26:46,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +50: [2023-04-29 11:26:46,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 11:26:46,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 11:26:46,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +31: [2023-04-29 11:26:46,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +46: [2023-04-29 11:26:46,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +63: [2023-04-29 11:26:46,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +63: [2023-04-29 11:26:46,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +60: [2023-04-29 11:26:46,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +13: [2023-04-29 11:26:46,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +50: [2023-04-29 11:26:46,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +44: [2023-04-29 11:26:46,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +28: [2023-04-29 11:26:46,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +28: [2023-04-29 11:26:46,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +13: [2023-04-29 11:26:46,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +13: [2023-04-29 11:26:46,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +18: [2023-04-29 11:26:46,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 11:26:46,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 11:26:46,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 11:26:46,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +63: [2023-04-29 11:26:46,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +47: [2023-04-29 11:26:46,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +36: [2023-04-29 11:26:46,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +36: [2023-04-29 11:26:46,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +36: [2023-04-29 11:26:46,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +58: [2023-04-29 11:26:46,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +58: [2023-04-29 11:26:46,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +49: [2023-04-29 11:26:46,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +49: [2023-04-29 11:26:46,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +36: [2023-04-29 11:26:46,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +31: [2023-04-29 11:26:46,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +50: [2023-04-29 11:26:46,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +50: [2023-04-29 11:26:46,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +14: [2023-04-29 11:26:46,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +38: [2023-04-29 11:26:46,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +13: [2023-04-29 11:26:46,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +63: [2023-04-29 11:26:46,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... + 7: [2023-04-29 11:26:46,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +54: [2023-04-29 11:26:46,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 11:26:46,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +18: [2023-04-29 11:26:46,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +18: [2023-04-29 11:26:46,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +44: [2023-04-29 11:26:46,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +18: [2023-04-29 11:26:46,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +34: [2023-04-29 11:26:46,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +31: [2023-04-29 11:26:46,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +46: [2023-04-29 11:26:46,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +63: [2023-04-29 11:26:46,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +34: [2023-04-29 11:26:46,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 7: [2023-04-29 11:26:46,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +57: [2023-04-29 11:26:46,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +38: [2023-04-29 11:26:46,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +37: [2023-04-29 11:26:46,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +49: [2023-04-29 11:26:46,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +49: [2023-04-29 11:26:46,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +49: [2023-04-29 11:26:46,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +58: [2023-04-29 11:26:46,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +58: [2023-04-29 11:26:46,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +58: [2023-04-29 11:26:46,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +49: [2023-04-29 11:26:46,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +55: [2023-04-29 11:26:46,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +54: [2023-04-29 11:26:46,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +54: [2023-04-29 11:26:46,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +54: [2023-04-29 11:26:46,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +63: [2023-04-29 11:26:46,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +54: [2023-04-29 11:26:46,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +46: [2023-04-29 11:26:46,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +42: [2023-04-29 11:26:46,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +57: [2023-04-29 11:26:46,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +59: [2023-04-29 11:26:46,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +57: [2023-04-29 11:26:46,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +57: [2023-04-29 11:26:46,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +49: [2023-04-29 11:26:46,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +49: [2023-04-29 11:26:46,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +47: [2023-04-29 11:26:46,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +47: [2023-04-29 11:26:46,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +37: [2023-04-29 11:26:46,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +47: [2023-04-29 11:26:46,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 9: [2023-04-29 11:26:46,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 6: [2023-04-29 11:26:46,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 6: [2023-04-29 11:26:46,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 6: [2023-04-29 11:26:46,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +42: [2023-04-29 11:26:46,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +47: [2023-04-29 11:26:46,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +14: [2023-04-29 11:26:46,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +49: [2023-04-29 11:26:46,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +46: [2023-04-29 11:26:46,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... + 9: [2023-04-29 11:26:46,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +59: [2023-04-29 11:26:46,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +38: [2023-04-29 11:26:46,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +38: [2023-04-29 11:26:46,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +38: [2023-04-29 11:26:46,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +55: [2023-04-29 11:26:46,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +31: [2023-04-29 11:26:46,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +34: [2023-04-29 11:26:46,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 9: [2023-04-29 11:26:46,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +47: [2023-04-29 11:26:46,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +47: [2023-04-29 11:26:46,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +59: [2023-04-29 11:26:46,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +55: [2023-04-29 11:26:46,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +58: [2023-04-29 11:26:46,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +46: [2023-04-29 11:26:46,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +42: [2023-04-29 11:26:46,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +14: [2023-04-29 11:26:46,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +52: [2023-04-29 11:26:46,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +49: [2023-04-29 11:26:46,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +57: [2023-04-29 11:26:46,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +46: [2023-04-29 11:26:46,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +41: [2023-04-29 11:26:46,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +41: [2023-04-29 11:26:46,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +49: [2023-04-29 11:26:46,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +57: [2023-04-29 11:26:46,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +57: [2023-04-29 11:26:46,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +49: [2023-04-29 11:26:46,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +56: [2023-04-29 11:26:46,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +57: [2023-04-29 11:26:46,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +57: [2023-04-29 11:26:46,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +47: [2023-04-29 11:26:46,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +47: [2023-04-29 11:26:46,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +57: [2023-04-29 11:26:46,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +42: [2023-04-29 11:26:46,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +42: [2023-04-29 11:26:46,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +52: [2023-04-29 11:26:46,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +52: [2023-04-29 11:26:46,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +57: [2023-04-29 11:26:46,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +16: [2023-04-29 11:26:46,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +16: [2023-04-29 11:26:46,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +57: [2023-04-29 11:26:46,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +16: [2023-04-29 11:26:46,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +16: [2023-04-29 11:26:46,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +19: [2023-04-29 11:26:46,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +46: [2023-04-29 11:26:46,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +43: [2023-04-29 11:26:46,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +43: [2023-04-29 11:26:46,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +46: [2023-04-29 11:26:46,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +44: [2023-04-29 11:26:46,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +31: [2023-04-29 11:26:46,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +14: [2023-04-29 11:26:46,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +17: [2023-04-29 11:26:46,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +47: [2023-04-29 11:26:46,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +52: [2023-04-29 11:26:46,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +41: [2023-04-29 11:26:46,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +41: [2023-04-29 11:26:46,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +41: [2023-04-29 11:26:46,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +31: [2023-04-29 11:26:46,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +19: [2023-04-29 11:26:46,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +60: [2023-04-29 11:26:46,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +60: [2023-04-29 11:26:46,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +60: [2023-04-29 11:26:46,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +38: [2023-04-29 11:26:46,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... + 4: [2023-04-29 11:26:46,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +52: [2023-04-29 11:26:46,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +60: [2023-04-29 11:26:46,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +38: [2023-04-29 11:26:46,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +51: [2023-04-29 11:26:46,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +54: [2023-04-29 11:26:46,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +56: [2023-04-29 11:26:46,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +19: [2023-04-29 11:26:46,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +19: [2023-04-29 11:26:46,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +16: [2023-04-29 11:26:46,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +42: [2023-04-29 11:26:46,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +17: [2023-04-29 11:26:46,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +44: [2023-04-29 11:26:46,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +46: [2023-04-29 11:26:46,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +52: [2023-04-29 11:26:46,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +28: [2023-04-29 11:26:46,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +52: [2023-04-29 11:26:46,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... + 4: [2023-04-29 11:26:46,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +17: [2023-04-29 11:26:46,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +46: [2023-04-29 11:26:46,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +16: [2023-04-29 11:26:46,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +39: [2023-04-29 11:26:46,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 11:26:46,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +14: [2023-04-29 11:26:46,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +38: [2023-04-29 11:26:46,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +16: [2023-04-29 11:26:46,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +43: [2023-04-29 11:26:46,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +43: [2023-04-29 11:26:46,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +47: [2023-04-29 11:26:46,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +41: [2023-04-29 11:26:46,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +37: [2023-04-29 11:26:46,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +37: [2023-04-29 11:26:46,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +51: [2023-04-29 11:26:46,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +51: [2023-04-29 11:26:46,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +16: [2023-04-29 11:26:46,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +56: [2023-04-29 11:26:46,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +52: [2023-04-29 11:26:46,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +41: [2023-04-29 11:26:46,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +41: [2023-04-29 11:26:46,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +28: [2023-04-29 11:26:46,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +46: [2023-04-29 11:26:46,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +62: [2023-04-29 11:26:46,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +28: [2023-04-29 11:26:46,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +28: [2023-04-29 11:26:46,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +14: [2023-04-29 11:26:46,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +39: [2023-04-29 11:26:46,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +17: [2023-04-29 11:26:46,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +51: [2023-04-29 11:26:46,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +38: [2023-04-29 11:26:46,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +38: [2023-04-29 11:26:46,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +38: [2023-04-29 11:26:46,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +21: [2023-04-29 11:26:46,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +56: [2023-04-29 11:26:46,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +29: [2023-04-29 11:26:46,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +29: [2023-04-29 11:26:46,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +29: [2023-04-29 11:26:46,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +14: [2023-04-29 11:26:46,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +24: [2023-04-29 11:26:46,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 11:26:46,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +44: [2023-04-29 11:26:46,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +42: [2023-04-29 11:26:46,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +29: [2023-04-29 11:26:46,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +31: [2023-04-29 11:26:46,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +31: [2023-04-29 11:26:46,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +31: [2023-04-29 11:26:46,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +39: [2023-04-29 11:26:46,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 11:26:46,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +17: [2023-04-29 11:26:46,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +46: [2023-04-29 11:26:46,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +54: [2023-04-29 11:26:46,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +22: [2023-04-29 11:26:46,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +22: [2023-04-29 11:26:46,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +21: [2023-04-29 11:26:46,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +46: [2023-04-29 11:26:46,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +62: [2023-04-29 11:26:46,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +49: [2023-04-29 11:26:46,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +49: [2023-04-29 11:26:46,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +38: [2023-04-29 11:26:46,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +55: [2023-04-29 11:26:46,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +24: [2023-04-29 11:26:46,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 11:26:46,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +41: [2023-04-29 11:26:46,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +17: [2023-04-29 11:26:46,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +54: [2023-04-29 11:26:46,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +54: [2023-04-29 11:26:46,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +14: [2023-04-29 11:26:46,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +38: [2023-04-29 11:26:46,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +25: [2023-04-29 11:26:46,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +25: [2023-04-29 11:26:46,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +29: [2023-04-29 11:26:46,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +38: [2023-04-29 11:26:46,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +29: [2023-04-29 11:26:46,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 7: [2023-04-29 11:26:46,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +54: [2023-04-29 11:26:46,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +31: [2023-04-29 11:26:46,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 7: [2023-04-29 11:26:46,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +31: [2023-04-29 11:26:46,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +54: [2023-04-29 11:26:46,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +17: [2023-04-29 11:26:46,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +54: [2023-04-29 11:26:46,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +29: [2023-04-29 11:26:46,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +31: [2023-04-29 11:26:46,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +54: [2023-04-29 11:26:46,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +42: [2023-04-29 11:26:46,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +55: [2023-04-29 11:26:46,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +29: [2023-04-29 11:26:46,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +62: [2023-04-29 11:26:46,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +62: [2023-04-29 11:26:46,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +62: [2023-04-29 11:26:46,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +22: [2023-04-29 11:26:46,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +22: [2023-04-29 11:26:46,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +38: [2023-04-29 11:26:46,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 9: [2023-04-29 11:26:46,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +25: [2023-04-29 11:26:46,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +25: [2023-04-29 11:26:46,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 6: [2023-04-29 11:26:46,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +49: [2023-04-29 11:26:46,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +62: [2023-04-29 11:26:46,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +55: [2023-04-29 11:26:46,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +17: [2023-04-29 11:26:46,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +41: [2023-04-29 11:26:46,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +55: [2023-04-29 11:26:46,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +47: [2023-04-29 11:26:46,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +21: [2023-04-29 11:26:46,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +57: [2023-04-29 11:26:46,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +42: [2023-04-29 11:26:46,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 9: [2023-04-29 11:26:46,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +47: [2023-04-29 11:26:46,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +60: [2023-04-29 11:26:46,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +41: [2023-04-29 11:26:46,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +56: [2023-04-29 11:26:46,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +56: [2023-04-29 11:26:46,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +11: [2023-04-29 11:26:46,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +42: [2023-04-29 11:26:46,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +41: [2023-04-29 11:26:46,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +49: [2023-04-29 11:26:46,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +42: [2023-04-29 11:26:46,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +57: [2023-04-29 11:26:46,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +60: [2023-04-29 11:26:46,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +63: [2023-04-29 11:26:46,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +63: [2023-04-29 11:26:46,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +63: [2023-04-29 11:26:46,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +47: [2023-04-29 11:26:46,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +63: [2023-04-29 11:26:46,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +47: [2023-04-29 11:26:46,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +62: [2023-04-29 11:26:46,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +57: [2023-04-29 11:26:46,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +61: [2023-04-29 11:26:46,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +61: [2023-04-29 11:26:46,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +61: [2023-04-29 11:26:46,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +62: [2023-04-29 11:26:46,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +57: [2023-04-29 11:26:46,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +61: [2023-04-29 11:26:46,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +21: [2023-04-29 11:26:46,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +60: [2023-04-29 11:26:46,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +43: [2023-04-29 11:26:46,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +43: [2023-04-29 11:26:46,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +62: [2023-04-29 11:26:46,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +62: [2023-04-29 11:26:46,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +15: [2023-04-29 11:26:46,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +15: [2023-04-29 11:26:46,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +15: [2023-04-29 11:26:46,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +46: [2023-04-29 11:26:46,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +46: [2023-04-29 11:26:46,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +42: [2023-04-29 11:26:46,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +15: [2023-04-29 11:26:46,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +42: [2023-04-29 11:26:46,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +56: [2023-04-29 11:26:46,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +41: [2023-04-29 11:26:46,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +42: [2023-04-29 11:26:46,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +11: [2023-04-29 11:26:46,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +22: [2023-04-29 11:26:46,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 3: [2023-04-29 11:26:46,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +47: [2023-04-29 11:26:46,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +27: [2023-04-29 11:26:46,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +21: [2023-04-29 11:26:46,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +63: [2023-04-29 11:26:46,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +42: [2023-04-29 11:26:46,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +22: [2023-04-29 11:26:46,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +60: [2023-04-29 11:26:46,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +21: [2023-04-29 11:26:46,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +54: [2023-04-29 11:26:46,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +43: [2023-04-29 11:26:46,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +51: [2023-04-29 11:26:46,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +63: [2023-04-29 11:26:46,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +63: [2023-04-29 11:26:46,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +63: [2023-04-29 11:26:46,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +15: [2023-04-29 11:26:46,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +15: [2023-04-29 11:26:46,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +15: [2023-04-29 11:26:46,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +15: [2023-04-29 11:26:46,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +27: [2023-04-29 11:26:46,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +62: [2023-04-29 11:26:46,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 11:26:46,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +62: [2023-04-29 11:26:46,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +42: [2023-04-29 11:26:46,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +62: [2023-04-29 11:26:46,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +43: [2023-04-29 11:26:46,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +56: [2023-04-29 11:26:46,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +56: [2023-04-29 11:26:46,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +13: [2023-04-29 11:26:46,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +13: [2023-04-29 11:26:46,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +13: [2023-04-29 11:26:46,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +27: [2023-04-29 11:26:46,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +13: [2023-04-29 11:26:46,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +56: [2023-04-29 11:26:46,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +52: [2023-04-29 11:26:46,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +24: [2023-04-29 11:26:46,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +51: [2023-04-29 11:26:46,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +51: [2023-04-29 11:26:46,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +21: [2023-04-29 11:26:46,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +38: [2023-04-29 11:26:46,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +27: [2023-04-29 11:26:46,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +11: [2023-04-29 11:26:46,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +11: [2023-04-29 11:26:46,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +51: [2023-04-29 11:26:46,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +56: [2023-04-29 11:26:46,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +24: [2023-04-29 11:26:46,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +22: [2023-04-29 11:26:46,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +21: [2023-04-29 11:26:46,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +62: [2023-04-29 11:26:46,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +56: [2023-04-29 11:26:46,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +22: [2023-04-29 11:26:46,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +27: [2023-04-29 11:26:46,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +11: [2023-04-29 11:26:46,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +13: [2023-04-29 11:26:46,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +13: [2023-04-29 11:26:46,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +36: [2023-04-29 11:26:46,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +13: [2023-04-29 11:26:46,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +13: [2023-04-29 11:26:46,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +24: [2023-04-29 11:26:46,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +56: [2023-04-29 11:26:46,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +52: [2023-04-29 11:26:46,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +54: [2023-04-29 11:26:46,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +27: [2023-04-29 11:26:46,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +11: [2023-04-29 11:26:46,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 5: [2023-04-29 11:26:46,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +24: [2023-04-29 11:26:46,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +25: [2023-04-29 11:26:46,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +25: [2023-04-29 11:26:46,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +11: [2023-04-29 11:26:46,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +54: [2023-04-29 11:26:46,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +56: [2023-04-29 11:26:46,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_00-model_states.pt. +55: [2023-04-29 11:26:46,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. + 5: [2023-04-29 11:26:46,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +62: [2023-04-29 11:26:46,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +62: [2023-04-29 11:26:46,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +56: [2023-04-29 11:26:46,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... +35: [2023-04-29 11:26:46,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 11:26:46,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +18: [2023-04-29 11:26:46,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 11:26:46,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 11:26:46,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +52: [2023-04-29 11:26:46,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 11:26:46,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 11:26:46,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 11:26:46,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 11:26:46,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 11:26:46,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 11:26:46,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +25: [2023-04-29 11:26:46,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +25: [2023-04-29 11:26:46,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +11: [2023-04-29 11:26:46,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +27: [2023-04-29 11:26:46,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +60: [2023-04-29 11:26:46,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +36: [2023-04-29 11:26:46,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +36: [2023-04-29 11:26:46,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +36: [2023-04-29 11:26:46,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +52: [2023-04-29 11:26:46,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +18: [2023-04-29 11:26:46,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +56: [2023-04-29 11:26:46,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt... + 1: [2023-04-29 11:26:46,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +35: [2023-04-29 11:26:46,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +35: [2023-04-29 11:26:46,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +61: [2023-04-29 11:26:46,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +35: [2023-04-29 11:26:46,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +60: [2023-04-29 11:26:46,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +60: [2023-04-29 11:26:46,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +61: [2023-04-29 11:26:46,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +27: [2023-04-29 11:26:46,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +35: [2023-04-29 11:26:46,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +35: [2023-04-29 11:26:46,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +35: [2023-04-29 11:26:46,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +35: [2023-04-29 11:26:46,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +60: [2023-04-29 11:26:46,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +35: [2023-04-29 11:26:46,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +61: [2023-04-29 11:26:46,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +52: [2023-04-29 11:26:46,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +61: [2023-04-29 11:26:46,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +19: [2023-04-29 11:26:46,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +16: [2023-04-29 11:26:46,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +49: [2023-04-29 11:26:46,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +19: [2023-04-29 11:26:46,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +19: [2023-04-29 11:26:46,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +19: [2023-04-29 11:26:46,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +19: [2023-04-29 11:26:46,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 11:26:46,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +36: [2023-04-29 11:26:46,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +28: [2023-04-29 11:26:46,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +52: [2023-04-29 11:26:46,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 9: [2023-04-29 11:26:46,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +49: [2023-04-29 11:26:46,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +49: [2023-04-29 11:26:46,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +19: [2023-04-29 11:26:46,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +19: [2023-04-29 11:26:46,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +19: [2023-04-29 11:26:46,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +52: [2023-04-29 11:26:46,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +16: [2023-04-29 11:26:46,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +49: [2023-04-29 11:26:46,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +16: [2023-04-29 11:26:46,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +28: [2023-04-29 11:26:46,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +28: [2023-04-29 11:26:46,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +10: [2023-04-29 11:26:46,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +10: [2023-04-29 11:26:46,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +10: [2023-04-29 11:26:46,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 5: [2023-04-29 11:26:46,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +24: [2023-04-29 11:26:46,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +24: [2023-04-29 11:26:46,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +24: [2023-04-29 11:26:46,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +10: [2023-04-29 11:26:46,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +24: [2023-04-29 11:26:46,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +18: [2023-04-29 11:26:46,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +18: [2023-04-29 11:26:46,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 5: [2023-04-29 11:26:46,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +18: [2023-04-29 11:26:46,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +52: [2023-04-29 11:26:46,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +28: [2023-04-29 11:26:46,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +60: [2023-04-29 11:26:46,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +18: [2023-04-29 11:26:46,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +18: [2023-04-29 11:26:46,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +16: [2023-04-29 11:26:46,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 11:26:46,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +18: [2023-04-29 11:26:46,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +29: [2023-04-29 11:26:46,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +12: [2023-04-29 11:26:46,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +12: [2023-04-29 11:26:46,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +29: [2023-04-29 11:26:46,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +12: [2023-04-29 11:26:46,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +12: [2023-04-29 11:26:46,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +28: [2023-04-29 11:26:46,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +36: [2023-04-29 11:26:46,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +28: [2023-04-29 11:26:46,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +36: [2023-04-29 11:26:46,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +36: [2023-04-29 11:26:46,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +49: [2023-04-29 11:26:46,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +49: [2023-04-29 11:26:46,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +28: [2023-04-29 11:26:46,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +12: [2023-04-29 11:26:46,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +12: [2023-04-29 11:26:46,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +12: [2023-04-29 11:26:46,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +12: [2023-04-29 11:26:46,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +12: [2023-04-29 11:26:46,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +12: [2023-04-29 11:26:46,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +12: [2023-04-29 11:26:46,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +29: [2023-04-29 11:26:46,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +54: [2023-04-29 11:26:46,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +60: [2023-04-29 11:26:46,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 7: [2023-04-29 11:26:46,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +12: [2023-04-29 11:26:46,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 6: [2023-04-29 11:26:46,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +54: [2023-04-29 11:26:46,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +16: [2023-04-29 11:26:46,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 7: [2023-04-29 11:26:46,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +29: [2023-04-29 11:26:46,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +49: [2023-04-29 11:26:46,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +49: [2023-04-29 11:26:46,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +60: [2023-04-29 11:26:46,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +60: [2023-04-29 11:26:46,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +28: [2023-04-29 11:26:46,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +63: [2023-04-29 11:26:46,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +54: [2023-04-29 11:26:46,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +60: [2023-04-29 11:26:46,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +60: [2023-04-29 11:26:46,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... + 6: [2023-04-29 11:26:46,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +63: [2023-04-29 11:26:46,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +49: [2023-04-29 11:26:46,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +27: [2023-04-29 11:26:46,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +27: [2023-04-29 11:26:46,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +27: [2023-04-29 11:26:46,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +54: [2023-04-29 11:26:46,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +54: [2023-04-29 11:26:46,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +27: [2023-04-29 11:26:46,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... + 6: [2023-04-29 11:26:46,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +60: [2023-04-29 11:26:46,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +60: [2023-04-29 11:26:46,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +60: [2023-04-29 11:26:46,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 9: [2023-04-29 11:26:46,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +54: [2023-04-29 11:26:46,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... + 9: [2023-04-29 11:26:46,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... + 6: [2023-04-29 11:26:46,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +49: [2023-04-29 11:26:46,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +49: [2023-04-29 11:26:46,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +60: [2023-04-29 11:26:46,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +27: [2023-04-29 11:26:46,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +27: [2023-04-29 11:26:46,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +27: [2023-04-29 11:26:46,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +27: [2023-04-29 11:26:46,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +54: [2023-04-29 11:26:46,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 9: [2023-04-29 11:26:46,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +15: [2023-04-29 11:26:46,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 11:26:46,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +10: [2023-04-29 11:26:46,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +15: [2023-04-29 11:26:46,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +15: [2023-04-29 11:26:46,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +25: [2023-04-29 11:26:46,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +25: [2023-04-29 11:26:46,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +33: [2023-04-29 11:26:46,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +33: [2023-04-29 11:26:46,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +16: [2023-04-29 11:26:46,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +33: [2023-04-29 11:26:46,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +33: [2023-04-29 11:26:46,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +25: [2023-04-29 11:26:46,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +25: [2023-04-29 11:26:46,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +16: [2023-04-29 11:26:46,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +23: [2023-04-29 11:26:46,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +23: [2023-04-29 11:26:46,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +23: [2023-04-29 11:26:46,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +63: [2023-04-29 11:26:46,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +23: [2023-04-29 11:26:46,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +63: [2023-04-29 11:26:46,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +54: [2023-04-29 11:26:46,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +15: [2023-04-29 11:26:46,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +61: [2023-04-29 11:26:46,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +61: [2023-04-29 11:26:46,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +61: [2023-04-29 11:26:46,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +61: [2023-04-29 11:26:46,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +24: [2023-04-29 11:26:46,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +29: [2023-04-29 11:26:46,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +33: [2023-04-29 11:26:46,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +13: [2023-04-29 11:26:46,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +33: [2023-04-29 11:26:46,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +49: [2023-04-29 11:26:46,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +25: [2023-04-29 11:26:46,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +10: [2023-04-29 11:26:46,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +10: [2023-04-29 11:26:46,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +33: [2023-04-29 11:26:46,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +25: [2023-04-29 11:26:46,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +13: [2023-04-29 11:26:46,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +33: [2023-04-29 11:26:46,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +12: [2023-04-29 11:26:46,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +25: [2023-04-29 11:26:46,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +10: [2023-04-29 11:26:46,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +29: [2023-04-29 11:26:46,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +18: [2023-04-29 11:26:46,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +17: [2023-04-29 11:26:46,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +17: [2023-04-29 11:26:46,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +17: [2023-04-29 11:26:46,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 11:26:46,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +25: [2023-04-29 11:26:46,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +18: [2023-04-29 11:26:46,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +61: [2023-04-29 11:26:46,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +17: [2023-04-29 11:26:46,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 11:26:46,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +24: [2023-04-29 11:26:46,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +24: [2023-04-29 11:26:46,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +61: [2023-04-29 11:26:46,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +49: [2023-04-29 11:26:46,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +49: [2023-04-29 11:26:46,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +61: [2023-04-29 11:26:46,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +61: [2023-04-29 11:26:46,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +25: [2023-04-29 11:26:46,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +16: [2023-04-29 11:26:46,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +12: [2023-04-29 11:26:46,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +49: [2023-04-29 11:26:46,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +17: [2023-04-29 11:26:46,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +12: [2023-04-29 11:26:46,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +12: [2023-04-29 11:26:46,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +17: [2023-04-29 11:26:46,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +25: [2023-04-29 11:26:46,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +25: [2023-04-29 11:26:46,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +13: [2023-04-29 11:26:46,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +60: [2023-04-29 11:26:46,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +63: [2023-04-29 11:26:46,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 7: [2023-04-29 11:26:46,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +17: [2023-04-29 11:26:46,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +29: [2023-04-29 11:26:46,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +29: [2023-04-29 11:26:46,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +17: [2023-04-29 11:26:46,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +25: [2023-04-29 11:26:46,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 7: [2023-04-29 11:26:46,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 7: [2023-04-29 11:26:46,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +63: [2023-04-29 11:26:46,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +25: [2023-04-29 11:26:46,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +35: [2023-04-29 11:26:46,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +13: [2023-04-29 11:26:46,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +49: [2023-04-29 11:26:46,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +25: [2023-04-29 11:26:46,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +25: [2023-04-29 11:26:46,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +60: [2023-04-29 11:26:46,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +61: [2023-04-29 11:26:46,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +35: [2023-04-29 11:26:46,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 11:26:46,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +35: [2023-04-29 11:26:46,544] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +15: [2023-04-29 11:26:46,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +15: [2023-04-29 11:26:46,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +15: [2023-04-29 11:26:46,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +25: [2023-04-29 11:26:46,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +61: [2023-04-29 11:26:46,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +23: [2023-04-29 11:26:46,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +61: [2023-04-29 11:26:46,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +15: [2023-04-29 11:26:46,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +23: [2023-04-29 11:26:46,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +23: [2023-04-29 11:26:46,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +23: [2023-04-29 11:26:46,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +63: [2023-04-29 11:26:46,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +61: [2023-04-29 11:26:46,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +13: [2023-04-29 11:26:46,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +63: [2023-04-29 11:26:46,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +61: [2023-04-29 11:26:46,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +13: [2023-04-29 11:26:46,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +61: [2023-04-29 11:26:46,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... + 5: [2023-04-29 11:26:46,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +13: [2023-04-29 11:26:46,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +61: [2023-04-29 11:26:46,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +35: [2023-04-29 11:26:46,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +16: [2023-04-29 11:26:46,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +16: [2023-04-29 11:26:46,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +61: [2023-04-29 11:26:46,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... + 5: [2023-04-29 11:26:46,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +13: [2023-04-29 11:26:46,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +16: [2023-04-29 11:26:46,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +16: [2023-04-29 11:26:46,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 3: [2023-04-29 11:26:46,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +35: [2023-04-29 11:26:46,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +35: [2023-04-29 11:26:46,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +27: [2023-04-29 11:26:46,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 11:26:46,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 11:26:46,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +35: [2023-04-29 11:26:46,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +24: [2023-04-29 11:26:46,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +12: [2023-04-29 11:26:46,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +12: [2023-04-29 11:26:46,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 11:26:46,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 11:26:46,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +23: [2023-04-29 11:26:46,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +33: [2023-04-29 11:26:46,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +23: [2023-04-29 11:26:46,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +15: [2023-04-29 11:26:46,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +15: [2023-04-29 11:26:46,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +15: [2023-04-29 11:26:46,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +15: [2023-04-29 11:26:46,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +10: [2023-04-29 11:26:46,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 11:26:46,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +24: [2023-04-29 11:26:46,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +48: [2023-04-29 11:26:46,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +48: [2023-04-29 11:26:46,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +12: [2023-04-29 11:26:46,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +27: [2023-04-29 11:26:46,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +27: [2023-04-29 11:26:46,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +27: [2023-04-29 11:26:46,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 11:26:46,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +48: [2023-04-29 11:26:46,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +48: [2023-04-29 11:26:46,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +61: [2023-04-29 11:26:46,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +48: [2023-04-29 11:26:46,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +23: [2023-04-29 11:26:46,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +23: [2023-04-29 11:26:46,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +48: [2023-04-29 11:26:46,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +10: [2023-04-29 11:26:46,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +53: [2023-04-29 11:26:46,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +53: [2023-04-29 11:26:46,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +53: [2023-04-29 11:26:46,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +25: [2023-04-29 11:26:46,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +53: [2023-04-29 11:26:46,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +33: [2023-04-29 11:26:46,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +18: [2023-04-29 11:26:46,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 11:26:46,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +33: [2023-04-29 11:26:46,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +12: [2023-04-29 11:26:46,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +48: [2023-04-29 11:26:46,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +33: [2023-04-29 11:26:46,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +17: [2023-04-29 11:26:46,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +12: [2023-04-29 11:26:46,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +48: [2023-04-29 11:26:46,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +24: [2023-04-29 11:26:46,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 11:26:46,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 11:26:46,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +25: [2023-04-29 11:26:46,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +25: [2023-04-29 11:26:46,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +53: [2023-04-29 11:26:46,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +53: [2023-04-29 11:26:46,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +53: [2023-04-29 11:26:46,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +53: [2023-04-29 11:26:46,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 7: [2023-04-29 11:26:46,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +10: [2023-04-29 11:26:46,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +10: [2023-04-29 11:26:46,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 11:26:46,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +18: [2023-04-29 11:26:46,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +25: [2023-04-29 11:26:46,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 11:26:46,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +12: [2023-04-29 11:26:46,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +16: [2023-04-29 11:26:46,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 7: [2023-04-29 11:26:46,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +61: [2023-04-29 11:26:46,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +10: [2023-04-29 11:26:46,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 11:26:46,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +24: [2023-04-29 11:26:46,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +24: [2023-04-29 11:26:46,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +16: [2023-04-29 11:26:46,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +17: [2023-04-29 11:26:46,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 11:26:46,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +12: [2023-04-29 11:26:46,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +33: [2023-04-29 11:26:46,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +22: [2023-04-29 11:26:46,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +22: [2023-04-29 11:26:46,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +22: [2023-04-29 11:26:46,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +16: [2023-04-29 11:26:46,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +17: [2023-04-29 11:26:46,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +10: [2023-04-29 11:26:46,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +17: [2023-04-29 11:26:46,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +22: [2023-04-29 11:26:46,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +10: [2023-04-29 11:26:46,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +61: [2023-04-29 11:26:46,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... + 7: [2023-04-29 11:26:46,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... + 7: [2023-04-29 11:26:46,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +61: [2023-04-29 11:26:46,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +12: [2023-04-29 11:26:46,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +10: [2023-04-29 11:26:46,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +16: [2023-04-29 11:26:46,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +20: [2023-04-29 11:26:46,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +20: [2023-04-29 11:26:46,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +20: [2023-04-29 11:26:46,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +20: [2023-04-29 11:26:46,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_11-model_01-model_states.pt. +12: [2023-04-29 11:26:46,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +12: [2023-04-29 11:26:46,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +22: [2023-04-29 11:26:46,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +32: [2023-04-29 11:26:46,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +32: [2023-04-29 11:26:46,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. + 8: [2023-04-29 11:26:46,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 11:26:46,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +32: [2023-04-29 11:26:46,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +15: [2023-04-29 11:26:46,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +22: [2023-04-29 11:26:46,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +32: [2023-04-29 11:26:46,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +12: [2023-04-29 11:26:46,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +22: [2023-04-29 11:26:46,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +15: [2023-04-29 11:26:46,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +27: [2023-04-29 11:26:46,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +15: [2023-04-29 11:26:46,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +22: [2023-04-29 11:26:46,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +23: [2023-04-29 11:26:46,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +15: [2023-04-29 11:26:46,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +61: [2023-04-29 11:26:46,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +17: [2023-04-29 11:26:46,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 11:26:46,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 7: [2023-04-29 11:26:46,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 11:26:46,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +23: [2023-04-29 11:26:46,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +25: [2023-04-29 11:26:46,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +14: [2023-04-29 11:26:46,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +14: [2023-04-29 11:26:46,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +14: [2023-04-29 11:26:46,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +14: [2023-04-29 11:26:46,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +12: [2023-04-29 11:26:46,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +27: [2023-04-29 11:26:46,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 11:26:46,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +23: [2023-04-29 11:26:46,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +25: [2023-04-29 11:26:46,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +33: [2023-04-29 11:26:46,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +23: [2023-04-29 11:26:46,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +14: [2023-04-29 11:26:46,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +33: [2023-04-29 11:26:46,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +33: [2023-04-29 11:26:46,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +12: [2023-04-29 11:26:46,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +25: [2023-04-29 11:26:46,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +14: [2023-04-29 11:26:46,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +23: [2023-04-29 11:26:46,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +14: [2023-04-29 11:26:46,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +12: [2023-04-29 11:26:46,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +25: [2023-04-29 11:26:46,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +17: [2023-04-29 11:26:46,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +12: [2023-04-29 11:26:46,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +14: [2023-04-29 11:26:46,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +61: [2023-04-29 11:26:46,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +26: [2023-04-29 11:26:46,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +26: [2023-04-29 11:26:46,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 11:26:46,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +17: [2023-04-29 11:26:46,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +33: [2023-04-29 11:26:46,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +33: [2023-04-29 11:26:46,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +33: [2023-04-29 11:26:46,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +33: [2023-04-29 11:26:46,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +17: [2023-04-29 11:26:46,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +12: [2023-04-29 11:26:46,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +61: [2023-04-29 11:26:46,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +26: [2023-04-29 11:26:46,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +26: [2023-04-29 11:26:46,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +20: [2023-04-29 11:26:46,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 11:26:46,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 11:26:46,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +40: [2023-04-29 11:26:46,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +40: [2023-04-29 11:26:46,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +40: [2023-04-29 11:26:46,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +40: [2023-04-29 11:26:46,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +61: [2023-04-29 11:26:46,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +26: [2023-04-29 11:26:46,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +26: [2023-04-29 11:26:46,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +45: [2023-04-29 11:26:46,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +23: [2023-04-29 11:26:46,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +45: [2023-04-29 11:26:46,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +45: [2023-04-29 11:26:46,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +45: [2023-04-29 11:26:46,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +56: [2023-04-29 11:26:46,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +56: [2023-04-29 11:26:46,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +26: [2023-04-29 11:26:46,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +56: [2023-04-29 11:26:46,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +56: [2023-04-29 11:26:46,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_33-model_01-model_states.pt. +48: [2023-04-29 11:26:46,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +40: [2023-04-29 11:26:46,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +40: [2023-04-29 11:26:46,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +45: [2023-04-29 11:26:46,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +45: [2023-04-29 11:26:46,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +40: [2023-04-29 11:26:46,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +26: [2023-04-29 11:26:46,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +40: [2023-04-29 11:26:46,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +28: [2023-04-29 11:26:46,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +28: [2023-04-29 11:26:46,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +28: [2023-04-29 11:26:46,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +45: [2023-04-29 11:26:46,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +28: [2023-04-29 11:26:46,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +20: [2023-04-29 11:26:46,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +20: [2023-04-29 11:26:46,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +45: [2023-04-29 11:26:46,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +20: [2023-04-29 11:26:46,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt... +20: [2023-04-29 11:26:46,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +32: [2023-04-29 11:26:46,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +20: [2023-04-29 11:26:46,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +32: [2023-04-29 11:26:46,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +53: [2023-04-29 11:26:46,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +28: [2023-04-29 11:26:46,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +28: [2023-04-29 11:26:46,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +28: [2023-04-29 11:26:46,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +20: [2023-04-29 11:26:46,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +20: [2023-04-29 11:26:46,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +48: [2023-04-29 11:26:46,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +32: [2023-04-29 11:26:46,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +28: [2023-04-29 11:26:46,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +32: [2023-04-29 11:26:46,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +20: [2023-04-29 11:26:46,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +20: [2023-04-29 11:26:46,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +23: [2023-04-29 11:26:46,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +23: [2023-04-29 11:26:46,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +11: [2023-04-29 11:26:46,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +11: [2023-04-29 11:26:46,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +48: [2023-04-29 11:26:46,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +11: [2023-04-29 11:26:46,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +11: [2023-04-29 11:26:46,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +48: [2023-04-29 11:26:46,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +53: [2023-04-29 11:26:46,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +53: [2023-04-29 11:26:46,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +33: [2023-04-29 11:26:46,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +32: [2023-04-29 11:26:46,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +32: [2023-04-29 11:26:46,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +32: [2023-04-29 11:26:46,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +32: [2023-04-29 11:26:46,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +33: [2023-04-29 11:26:46,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +33: [2023-04-29 11:26:46,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +11: [2023-04-29 11:26:46,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +33: [2023-04-29 11:26:46,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +23: [2023-04-29 11:26:46,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +11: [2023-04-29 11:26:46,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +30: [2023-04-29 11:26:46,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +30: [2023-04-29 11:26:46,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +30: [2023-04-29 11:26:46,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +11: [2023-04-29 11:26:46,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +11: [2023-04-29 11:26:46,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +30: [2023-04-29 11:26:46,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +53: [2023-04-29 11:26:46,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +56: [2023-04-29 11:26:46,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +21: [2023-04-29 11:26:46,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +21: [2023-04-29 11:26:46,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +21: [2023-04-29 11:26:46,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +48: [2023-04-29 11:26:46,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +21: [2023-04-29 11:26:46,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +22: [2023-04-29 11:26:46,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +56: [2023-04-29 11:26:46,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +16: [2023-04-29 11:26:46,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +32: [2023-04-29 11:26:46,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +32: [2023-04-29 11:26:46,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +50: [2023-04-29 11:26:46,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +50: [2023-04-29 11:26:46,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +50: [2023-04-29 11:26:46,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +50: [2023-04-29 11:26:46,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +32: [2023-04-29 11:26:46,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +32: [2023-04-29 11:26:46,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +53: [2023-04-29 11:26:46,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +53: [2023-04-29 11:26:46,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +21: [2023-04-29 11:26:46,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +21: [2023-04-29 11:26:46,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +56: [2023-04-29 11:26:46,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +56: [2023-04-29 11:26:46,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt... +31: [2023-04-29 11:26:46,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +31: [2023-04-29 11:26:46,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +31: [2023-04-29 11:26:46,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +16: [2023-04-29 11:26:46,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +21: [2023-04-29 11:26:46,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +21: [2023-04-29 11:26:46,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +31: [2023-04-29 11:26:46,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +16: [2023-04-29 11:26:46,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +53: [2023-04-29 11:26:46,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +23: [2023-04-29 11:26:46,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +16: [2023-04-29 11:26:46,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +15: [2023-04-29 11:26:46,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +53: [2023-04-29 11:26:46,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +50: [2023-04-29 11:26:46,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +53: [2023-04-29 11:26:46,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +16: [2023-04-29 11:26:46,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... + 3: [2023-04-29 11:26:46,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +31: [2023-04-29 11:26:46,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +31: [2023-04-29 11:26:46,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +31: [2023-04-29 11:26:46,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +31: [2023-04-29 11:26:46,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +50: [2023-04-29 11:26:46,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +50: [2023-04-29 11:26:46,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +50: [2023-04-29 11:26:46,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +16: [2023-04-29 11:26:46,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... + 3: [2023-04-29 11:26:46,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +58: [2023-04-29 11:26:46,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +58: [2023-04-29 11:26:46,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +58: [2023-04-29 11:26:46,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +22: [2023-04-29 11:26:46,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 11:26:46,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +15: [2023-04-29 11:26:46,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +58: [2023-04-29 11:26:46,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +15: [2023-04-29 11:26:46,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... + 8: [2023-04-29 11:26:46,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 8: [2023-04-29 11:26:46,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 8: [2023-04-29 11:26:46,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +14: [2023-04-29 11:26:46,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +23: [2023-04-29 11:26:46,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +43: [2023-04-29 11:26:46,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +43: [2023-04-29 11:26:46,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +43: [2023-04-29 11:26:46,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +43: [2023-04-29 11:26:46,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +16: [2023-04-29 11:26:46,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +15: [2023-04-29 11:26:46,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +15: [2023-04-29 11:26:46,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +22: [2023-04-29 11:26:46,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +22: [2023-04-29 11:26:46,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +58: [2023-04-29 11:26:46,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +58: [2023-04-29 11:26:46,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +58: [2023-04-29 11:26:46,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +14: [2023-04-29 11:26:46,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +48: [2023-04-29 11:26:46,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +58: [2023-04-29 11:26:46,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +48: [2023-04-29 11:26:46,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +53: [2023-04-29 11:26:46,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +15: [2023-04-29 11:26:46,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +53: [2023-04-29 11:26:46,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +48: [2023-04-29 11:26:46,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +30: [2023-04-29 11:26:46,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 11:26:46,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +16: [2023-04-29 11:26:46,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +30: [2023-04-29 11:26:46,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +15: [2023-04-29 11:26:46,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +15: [2023-04-29 11:26:46,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +30: [2023-04-29 11:26:46,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +22: [2023-04-29 11:26:46,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +40: [2023-04-29 11:26:46,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +26: [2023-04-29 11:26:46,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +53: [2023-04-29 11:26:46,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +20: [2023-04-29 11:26:46,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. + 0: [2023-04-29 11:26:46,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 0: [2023-04-29 11:26:46,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 0: [2023-04-29 11:26:46,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 0: [2023-04-29 11:26:46,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +51: [2023-04-29 11:26:46,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +51: [2023-04-29 11:26:46,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +45: [2023-04-29 11:26:46,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +51: [2023-04-29 11:26:46,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +51: [2023-04-29 11:26:46,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +53: [2023-04-29 11:26:46,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +53: [2023-04-29 11:26:46,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +34: [2023-04-29 11:26:46,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +34: [2023-04-29 11:26:46,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +14: [2023-04-29 11:26:46,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +34: [2023-04-29 11:26:46,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +34: [2023-04-29 11:26:46,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +20: [2023-04-29 11:26:46,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +45: [2023-04-29 11:26:46,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +23: [2023-04-29 11:26:46,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +20: [2023-04-29 11:26:46,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +14: [2023-04-29 11:26:46,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +40: [2023-04-29 11:26:46,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +29: [2023-04-29 11:26:46,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +29: [2023-04-29 11:26:46,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +26: [2023-04-29 11:26:46,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +26: [2023-04-29 11:26:46,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +14: [2023-04-29 11:26:46,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +14: [2023-04-29 11:26:46,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +20: [2023-04-29 11:26:46,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +29: [2023-04-29 11:26:46,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +28: [2023-04-29 11:26:46,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +29: [2023-04-29 11:26:46,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +40: [2023-04-29 11:26:46,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +40: [2023-04-29 11:26:46,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +40: [2023-04-29 11:26:46,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +14: [2023-04-29 11:26:46,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +26: [2023-04-29 11:26:46,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +20: [2023-04-29 11:26:46,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +40: [2023-04-29 11:26:46,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +53: [2023-04-29 11:26:46,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +53: [2023-04-29 11:26:46,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +14: [2023-04-29 11:26:46,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 8: [2023-04-29 11:26:46,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +11: [2023-04-29 11:26:46,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +32: [2023-04-29 11:26:46,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +43: [2023-04-29 11:26:46,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +45: [2023-04-29 11:26:46,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +45: [2023-04-29 11:26:46,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +14: [2023-04-29 11:26:46,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +43: [2023-04-29 11:26:46,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +20: [2023-04-29 11:26:46,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... + 8: [2023-04-29 11:26:46,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +28: [2023-04-29 11:26:46,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +22: [2023-04-29 11:26:46,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +43: [2023-04-29 11:26:46,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +43: [2023-04-29 11:26:46,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +14: [2023-04-29 11:26:46,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +32: [2023-04-29 11:26:46,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +22: [2023-04-29 11:26:46,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +20: [2023-04-29 11:26:46,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +40: [2023-04-29 11:26:46,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +40: [2023-04-29 11:26:46,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +28: [2023-04-29 11:26:46,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +20: [2023-04-29 11:26:46,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +22: [2023-04-29 11:26:46,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +33: [2023-04-29 11:26:46,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +33: [2023-04-29 11:26:46,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +26: [2023-04-29 11:26:46,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +40: [2023-04-29 11:26:46,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +33: [2023-04-29 11:26:46,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +45: [2023-04-29 11:26:46,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +28: [2023-04-29 11:26:46,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +20: [2023-04-29 11:26:46,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_00-model_states.pt. +34: [2023-04-29 11:26:46,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +34: [2023-04-29 11:26:46,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +20: [2023-04-29 11:26:46,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +20: [2023-04-29 11:26:46,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +33: [2023-04-29 11:26:46,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +33: [2023-04-29 11:26:46,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +51: [2023-04-29 11:26:46,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +51: [2023-04-29 11:26:46,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +40: [2023-04-29 11:26:46,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +33: [2023-04-29 11:26:46,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +33: [2023-04-29 11:26:46,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... + 5: [2023-04-29 11:26:46,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +34: [2023-04-29 11:26:46,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +56: [2023-04-29 11:26:46,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +51: [2023-04-29 11:26:46,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +51: [2023-04-29 11:26:46,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +45: [2023-04-29 11:26:46,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +14: [2023-04-29 11:26:46,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +21: [2023-04-29 11:26:46,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +11: [2023-04-29 11:26:46,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +34: [2023-04-29 11:26:46,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +33: [2023-04-29 11:26:46,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +21: [2023-04-29 11:26:46,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +56: [2023-04-29 11:26:46,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +20: [2023-04-29 11:26:46,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt... +26: [2023-04-29 11:26:46,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +11: [2023-04-29 11:26:46,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +11: [2023-04-29 11:26:46,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +11: [2023-04-29 11:26:46,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +28: [2023-04-29 11:26:46,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +14: [2023-04-29 11:26:46,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +56: [2023-04-29 11:26:46,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +26: [2023-04-29 11:26:46,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +40: [2023-04-29 11:26:46,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +14: [2023-04-29 11:26:46,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +29: [2023-04-29 11:26:46,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +26: [2023-04-29 11:26:46,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +29: [2023-04-29 11:26:46,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +29: [2023-04-29 11:26:46,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +40: [2023-04-29 11:26:46,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +48: [2023-04-29 11:26:46,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +48: [2023-04-29 11:26:46,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +48: [2023-04-29 11:26:46,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +48: [2023-04-29 11:26:46,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +14: [2023-04-29 11:26:46,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +14: [2023-04-29 11:26:46,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +28: [2023-04-29 11:26:46,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +29: [2023-04-29 11:26:46,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +32: [2023-04-29 11:26:46,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +40: [2023-04-29 11:26:46,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +40: [2023-04-29 11:26:46,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +56: [2023-04-29 11:26:46,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +45: [2023-04-29 11:26:46,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +45: [2023-04-29 11:26:46,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +14: [2023-04-29 11:26:46,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +31: [2023-04-29 11:26:46,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +20: [2023-04-29 11:26:46,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +20: [2023-04-29 11:26:46,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +21: [2023-04-29 11:26:46,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +21: [2023-04-29 11:26:46,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +56: [2023-04-29 11:26:46,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +56: [2023-04-29 11:26:46,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_00-model_states.pt. +50: [2023-04-29 11:26:46,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +50: [2023-04-29 11:26:46,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +50: [2023-04-29 11:26:46,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +28: [2023-04-29 11:26:46,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +58: [2023-04-29 11:26:46,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +58: [2023-04-29 11:26:46,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +43: [2023-04-29 11:26:46,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +43: [2023-04-29 11:26:46,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +32: [2023-04-29 11:26:46,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +32: [2023-04-29 11:26:46,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +31: [2023-04-29 11:26:46,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +31: [2023-04-29 11:26:46,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +31: [2023-04-29 11:26:46,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +40: [2023-04-29 11:26:46,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +37: [2023-04-29 11:26:46,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +37: [2023-04-29 11:26:46,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +37: [2023-04-29 11:26:46,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +40: [2023-04-29 11:26:46,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +37: [2023-04-29 11:26:46,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. + 7: [2023-04-29 11:26:46,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +58: [2023-04-29 11:26:46,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +56: [2023-04-29 11:26:46,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... +56: [2023-04-29 11:26:46,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt... + 7: [2023-04-29 11:26:46,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +50: [2023-04-29 11:26:46,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 1: [2023-04-29 11:26:46,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +30: [2023-04-29 11:26:46,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +30: [2023-04-29 11:26:46,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 1: [2023-04-29 11:26:46,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 4: [2023-04-29 11:26:46,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +58: [2023-04-29 11:26:46,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +28: [2023-04-29 11:26:46,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +43: [2023-04-29 11:26:46,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +43: [2023-04-29 11:26:46,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 7: [2023-04-29 11:26:46,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +21: [2023-04-29 11:26:46,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +32: [2023-04-29 11:26:46,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +32: [2023-04-29 11:26:46,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +43: [2023-04-29 11:26:46,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +43: [2023-04-29 11:26:46,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +20: [2023-04-29 11:26:46,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +20: [2023-04-29 11:26:46,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +30: [2023-04-29 11:26:46,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +30: [2023-04-29 11:26:46,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +30: [2023-04-29 11:26:46,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +30: [2023-04-29 11:26:46,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +36: [2023-04-29 11:26:46,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +36: [2023-04-29 11:26:46,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +36: [2023-04-29 11:26:46,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +36: [2023-04-29 11:26:46,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +32: [2023-04-29 11:26:46,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +21: [2023-04-29 11:26:46,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +43: [2023-04-29 11:26:46,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +48: [2023-04-29 11:26:46,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +34: [2023-04-29 11:26:46,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +34: [2023-04-29 11:26:46,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +34: [2023-04-29 11:26:46,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +34: [2023-04-29 11:26:46,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +53: [2023-04-29 11:26:46,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +53: [2023-04-29 11:26:46,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +43: [2023-04-29 11:26:46,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +30: [2023-04-29 11:26:46,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +30: [2023-04-29 11:26:46,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +32: [2023-04-29 11:26:46,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +34: [2023-04-29 11:26:46,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +59: [2023-04-29 11:26:46,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +59: [2023-04-29 11:26:46,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +59: [2023-04-29 11:26:46,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +59: [2023-04-29 11:26:46,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +44: [2023-04-29 11:26:46,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +44: [2023-04-29 11:26:46,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +44: [2023-04-29 11:26:46,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +48: [2023-04-29 11:26:46,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +48: [2023-04-29 11:26:46,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +44: [2023-04-29 11:26:46,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +32: [2023-04-29 11:26:46,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +32: [2023-04-29 11:26:46,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +32: [2023-04-29 11:26:46,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +39: [2023-04-29 11:26:46,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +39: [2023-04-29 11:26:46,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +11: [2023-04-29 11:26:46,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +39: [2023-04-29 11:26:46,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +11: [2023-04-29 11:26:46,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +53: [2023-04-29 11:26:46,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +39: [2023-04-29 11:26:46,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +53: [2023-04-29 11:26:46,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... + 2: [2023-04-29 11:26:46,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +48: [2023-04-29 11:26:46,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +44: [2023-04-29 11:26:46,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +11: [2023-04-29 11:26:46,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +34: [2023-04-29 11:26:46,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +34: [2023-04-29 11:26:46,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +37: [2023-04-29 11:26:46,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +37: [2023-04-29 11:26:46,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +31: [2023-04-29 11:26:46,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +34: [2023-04-29 11:26:46,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +44: [2023-04-29 11:26:46,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +53: [2023-04-29 11:26:46,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +53: [2023-04-29 11:26:46,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +37: [2023-04-29 11:26:46,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +39: [2023-04-29 11:26:46,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +39: [2023-04-29 11:26:46,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +39: [2023-04-29 11:26:46,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +37: [2023-04-29 11:26:46,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +39: [2023-04-29 11:26:46,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 8: [2023-04-29 11:26:46,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +44: [2023-04-29 11:26:46,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +59: [2023-04-29 11:26:46,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +59: [2023-04-29 11:26:46,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +21: [2023-04-29 11:26:46,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +59: [2023-04-29 11:26:46,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +43: [2023-04-29 11:26:46,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 6: [2023-04-29 11:26:46,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 6: [2023-04-29 11:26:46,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +58: [2023-04-29 11:26:46,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +58: [2023-04-29 11:26:46,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +44: [2023-04-29 11:26:46,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +59: [2023-04-29 11:26:46,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +21: [2023-04-29 11:26:46,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +37: [2023-04-29 11:26:46,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +50: [2023-04-29 11:26:46,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +37: [2023-04-29 11:26:46,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +31: [2023-04-29 11:26:46,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +10: [2023-04-29 11:26:46,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +10: [2023-04-29 11:26:46,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +10: [2023-04-29 11:26:46,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +19: [2023-04-29 11:26:46,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +19: [2023-04-29 11:26:46,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +10: [2023-04-29 11:26:46,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +31: [2023-04-29 11:26:46,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +31: [2023-04-29 11:26:46,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +53: [2023-04-29 11:26:46,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +53: [2023-04-29 11:26:46,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +58: [2023-04-29 11:26:46,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +26: [2023-04-29 11:26:46,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +26: [2023-04-29 11:26:46,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +43: [2023-04-29 11:26:46,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +59: [2023-04-29 11:26:46,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +59: [2023-04-29 11:26:46,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +59: [2023-04-29 11:26:46,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +26: [2023-04-29 11:26:46,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +50: [2023-04-29 11:26:46,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +26: [2023-04-29 11:26:46,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 1: [2023-04-29 11:26:46,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +59: [2023-04-29 11:26:46,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +37: [2023-04-29 11:26:46,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +50: [2023-04-29 11:26:46,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +58: [2023-04-29 11:26:46,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +43: [2023-04-29 11:26:46,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +19: [2023-04-29 11:26:46,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +37: [2023-04-29 11:26:46,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +37: [2023-04-29 11:26:46,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +10: [2023-04-29 11:26:46,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +10: [2023-04-29 11:26:46,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +19: [2023-04-29 11:26:46,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +36: [2023-04-29 11:26:46,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +43: [2023-04-29 11:26:46,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +43: [2023-04-29 11:26:46,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +37: [2023-04-29 11:26:46,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +19: [2023-04-29 11:26:46,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +19: [2023-04-29 11:26:46,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +36: [2023-04-29 11:26:46,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +36: [2023-04-29 11:26:46,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +36: [2023-04-29 11:26:46,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +10: [2023-04-29 11:26:46,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +37: [2023-04-29 11:26:46,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +50: [2023-04-29 11:26:46,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +10: [2023-04-29 11:26:46,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +19: [2023-04-29 11:26:46,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +43: [2023-04-29 11:26:46,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +37: [2023-04-29 11:26:46,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +19: [2023-04-29 11:26:46,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +32: [2023-04-29 11:26:46,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +17: [2023-04-29 11:26:46,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +17: [2023-04-29 11:26:46,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +17: [2023-04-29 11:26:46,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 0: [2023-04-29 11:26:46,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +17: [2023-04-29 11:26:46,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 8: [2023-04-29 11:26:46,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... + 8: [2023-04-29 11:26:46,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +38: [2023-04-29 11:26:46,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +38: [2023-04-29 11:26:46,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 8: [2023-04-29 11:26:46,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +43: [2023-04-29 11:26:46,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +43: [2023-04-29 11:26:46,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +38: [2023-04-29 11:26:46,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +38: [2023-04-29 11:26:46,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +51: [2023-04-29 11:26:46,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +14: [2023-04-29 11:26:46,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +62: [2023-04-29 11:26:46,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +62: [2023-04-29 11:26:46,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +62: [2023-04-29 11:26:46,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +62: [2023-04-29 11:26:46,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +29: [2023-04-29 11:26:46,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +42: [2023-04-29 11:26:46,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +42: [2023-04-29 11:26:46,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +29: [2023-04-29 11:26:46,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +38: [2023-04-29 11:26:46,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +38: [2023-04-29 11:26:46,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +51: [2023-04-29 11:26:46,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +38: [2023-04-29 11:26:46,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +34: [2023-04-29 11:26:46,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +34: [2023-04-29 11:26:46,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +42: [2023-04-29 11:26:46,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +62: [2023-04-29 11:26:46,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +62: [2023-04-29 11:26:46,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +38: [2023-04-29 11:26:46,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +42: [2023-04-29 11:26:46,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +51: [2023-04-29 11:26:46,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 0: [2023-04-29 11:26:46,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... + 0: [2023-04-29 11:26:46,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +14: [2023-04-29 11:26:46,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +51: [2023-04-29 11:26:46,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +62: [2023-04-29 11:26:46,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +29: [2023-04-29 11:26:46,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +29: [2023-04-29 11:26:46,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +62: [2023-04-29 11:26:46,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +42: [2023-04-29 11:26:46,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +51: [2023-04-29 11:26:46,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +51: [2023-04-29 11:26:46,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +32: [2023-04-29 11:26:46,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +34: [2023-04-29 11:26:46,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +34: [2023-04-29 11:26:46,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +32: [2023-04-29 11:26:46,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +59: [2023-04-29 11:26:46,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +32: [2023-04-29 11:26:46,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +42: [2023-04-29 11:26:46,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +42: [2023-04-29 11:26:46,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +62: [2023-04-29 11:26:46,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +62: [2023-04-29 11:26:46,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +14: [2023-04-29 11:26:46,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +14: [2023-04-29 11:26:46,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +51: [2023-04-29 11:26:46,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +26: [2023-04-29 11:26:46,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +59: [2023-04-29 11:26:46,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +59: [2023-04-29 11:26:46,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 0: [2023-04-29 11:26:46,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +42: [2023-04-29 11:26:46,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +55: [2023-04-29 11:26:46,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +55: [2023-04-29 11:26:46,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +55: [2023-04-29 11:26:46,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +55: [2023-04-29 11:26:46,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +62: [2023-04-29 11:26:46,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +40: [2023-04-29 11:26:46,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +46: [2023-04-29 11:26:46,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +46: [2023-04-29 11:26:46,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +46: [2023-04-29 11:26:46,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +46: [2023-04-29 11:26:46,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +62: [2023-04-29 11:26:46,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +51: [2023-04-29 11:26:46,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +54: [2023-04-29 11:26:46,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +54: [2023-04-29 11:26:46,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +49: [2023-04-29 11:26:46,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +49: [2023-04-29 11:26:46,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +55: [2023-04-29 11:26:46,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +54: [2023-04-29 11:26:46,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +55: [2023-04-29 11:26:46,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +55: [2023-04-29 11:26:46,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +26: [2023-04-29 11:26:46,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +55: [2023-04-29 11:26:46,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +54: [2023-04-29 11:26:46,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +57: [2023-04-29 11:26:46,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +57: [2023-04-29 11:26:46,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +57: [2023-04-29 11:26:46,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +57: [2023-04-29 11:26:46,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +14: [2023-04-29 11:26:46,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +14: [2023-04-29 11:26:46,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +59: [2023-04-29 11:26:46,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +49: [2023-04-29 11:26:46,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +49: [2023-04-29 11:26:46,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +56: [2023-04-29 11:26:46,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +56: [2023-04-29 11:26:46,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +51: [2023-04-29 11:26:46,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +51: [2023-04-29 11:26:46,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +51: [2023-04-29 11:26:46,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +29: [2023-04-29 11:26:46,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +51: [2023-04-29 11:26:46,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +40: [2023-04-29 11:26:46,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... + 0: [2023-04-29 11:26:46,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +46: [2023-04-29 11:26:46,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +46: [2023-04-29 11:26:46,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +54: [2023-04-29 11:26:46,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +26: [2023-04-29 11:26:46,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +46: [2023-04-29 11:26:46,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +55: [2023-04-29 11:26:46,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +34: [2023-04-29 11:26:46,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +54: [2023-04-29 11:26:46,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +54: [2023-04-29 11:26:46,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +54: [2023-04-29 11:26:46,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +14: [2023-04-29 11:26:46,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +26: [2023-04-29 11:26:46,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +46: [2023-04-29 11:26:46,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +13: [2023-04-29 11:26:46,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +13: [2023-04-29 11:26:46,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +55: [2023-04-29 11:26:46,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +34: [2023-04-29 11:26:46,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +40: [2023-04-29 11:26:46,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +40: [2023-04-29 11:26:46,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +40: [2023-04-29 11:26:46,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +13: [2023-04-29 11:26:46,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +17: [2023-04-29 11:26:46,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +56: [2023-04-29 11:26:46,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +13: [2023-04-29 11:26:46,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +17: [2023-04-29 11:26:46,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +56: [2023-04-29 11:26:46,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +17: [2023-04-29 11:26:46,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +49: [2023-04-29 11:26:46,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +49: [2023-04-29 11:26:46,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +49: [2023-04-29 11:26:46,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +43: [2023-04-29 11:26:46,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +51: [2023-04-29 11:26:46,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +51: [2023-04-29 11:26:46,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +29: [2023-04-29 11:26:46,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +56: [2023-04-29 11:26:46,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +57: [2023-04-29 11:26:46,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +56: [2023-04-29 11:26:46,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +57: [2023-04-29 11:26:46,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +57: [2023-04-29 11:26:46,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 7: [2023-04-29 11:26:46,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +51: [2023-04-29 11:26:46,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +17: [2023-04-29 11:26:46,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +51: [2023-04-29 11:26:46,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +29: [2023-04-29 11:26:46,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +57: [2023-04-29 11:26:46,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +49: [2023-04-29 11:26:46,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +55: [2023-04-29 11:26:46,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +55: [2023-04-29 11:26:46,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +43: [2023-04-29 11:26:46,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +43: [2023-04-29 11:26:46,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 11:26:46,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 11:26:46,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 11:26:46,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 11:26:46,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +63: [2023-04-29 11:26:46,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 11:26:46,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +30: [2023-04-29 11:26:46,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +30: [2023-04-29 11:26:46,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +30: [2023-04-29 11:26:46,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +14: [2023-04-29 11:26:46,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +47: [2023-04-29 11:26:46,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +47: [2023-04-29 11:26:46,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +34: [2023-04-29 11:26:46,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +30: [2023-04-29 11:26:46,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +40: [2023-04-29 11:26:46,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +34: [2023-04-29 11:26:46,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +62: [2023-04-29 11:26:46,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +40: [2023-04-29 11:26:46,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +62: [2023-04-29 11:26:46,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +40: [2023-04-29 11:26:46,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... + 4: [2023-04-29 11:26:46,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +29: [2023-04-29 11:26:46,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +44: [2023-04-29 11:26:46,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +48: [2023-04-29 11:26:46,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +19: [2023-04-29 11:26:46,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +19: [2023-04-29 11:26:46,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +62: [2023-04-29 11:26:46,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +63: [2023-04-29 11:26:46,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +47: [2023-04-29 11:26:46,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +30: [2023-04-29 11:26:46,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +62: [2023-04-29 11:26:46,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +47: [2023-04-29 11:26:46,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 2: [2023-04-29 11:26:46,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 2: [2023-04-29 11:26:46,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +34: [2023-04-29 11:26:46,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... + 2: [2023-04-29 11:26:46,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +30: [2023-04-29 11:26:46,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +19: [2023-04-29 11:26:46,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +47: [2023-04-29 11:26:46,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +63: [2023-04-29 11:26:46,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +63: [2023-04-29 11:26:46,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +19: [2023-04-29 11:26:46,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +63: [2023-04-29 11:26:46,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +30: [2023-04-29 11:26:46,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 7: [2023-04-29 11:26:46,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +30: [2023-04-29 11:26:46,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +55: [2023-04-29 11:26:46,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +47: [2023-04-29 11:26:46,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 4: [2023-04-29 11:26:46,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +47: [2023-04-29 11:26:46,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +48: [2023-04-29 11:26:46,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +43: [2023-04-29 11:26:46,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +47: [2023-04-29 11:26:46,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +39: [2023-04-29 11:26:46,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 9: [2023-04-29 11:26:46,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 9: [2023-04-29 11:26:46,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 9: [2023-04-29 11:26:46,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +16: [2023-04-29 11:26:46,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +16: [2023-04-29 11:26:46,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +16: [2023-04-29 11:26:46,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +16: [2023-04-29 11:26:46,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +48: [2023-04-29 11:26:46,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +46: [2023-04-29 11:26:46,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +46: [2023-04-29 11:26:46,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +46: [2023-04-29 11:26:46,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +54: [2023-04-29 11:26:46,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +54: [2023-04-29 11:26:46,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +46: [2023-04-29 11:26:46,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. + 4: [2023-04-29 11:26:46,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 1: [2023-04-29 11:26:46,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +54: [2023-04-29 11:26:46,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +44: [2023-04-29 11:26:46,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +44: [2023-04-29 11:26:46,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +54: [2023-04-29 11:26:46,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +39: [2023-04-29 11:26:46,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +44: [2023-04-29 11:26:46,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +28: [2023-04-29 11:26:46,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +28: [2023-04-29 11:26:46,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +48: [2023-04-29 11:26:46,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +48: [2023-04-29 11:26:46,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +55: [2023-04-29 11:26:46,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +16: [2023-04-29 11:26:46,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +44: [2023-04-29 11:26:46,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +36: [2023-04-29 11:26:46,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +16: [2023-04-29 11:26:46,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +34: [2023-04-29 11:26:46,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +48: [2023-04-29 11:26:46,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +28: [2023-04-29 11:26:46,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +44: [2023-04-29 11:26:46,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +52: [2023-04-29 11:26:46,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +52: [2023-04-29 11:26:46,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +28: [2023-04-29 11:26:46,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +39: [2023-04-29 11:26:46,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +39: [2023-04-29 11:26:46,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +16: [2023-04-29 11:26:46,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +35: [2023-04-29 11:26:46,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +35: [2023-04-29 11:26:46,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +10: [2023-04-29 11:26:46,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +55: [2023-04-29 11:26:46,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +16: [2023-04-29 11:26:46,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +52: [2023-04-29 11:26:46,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +52: [2023-04-29 11:26:46,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +35: [2023-04-29 11:26:46,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +43: [2023-04-29 11:26:46,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +36: [2023-04-29 11:26:46,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +13: [2023-04-29 11:26:46,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +35: [2023-04-29 11:26:46,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +48: [2023-04-29 11:26:46,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... + 4: [2023-04-29 11:26:46,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +48: [2023-04-29 11:26:46,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +52: [2023-04-29 11:26:46,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +44: [2023-04-29 11:26:46,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +55: [2023-04-29 11:26:46,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +60: [2023-04-29 11:26:46,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +60: [2023-04-29 11:26:46,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +44: [2023-04-29 11:26:46,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +52: [2023-04-29 11:26:46,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +10: [2023-04-29 11:26:46,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +37: [2023-04-29 11:26:46,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +37: [2023-04-29 11:26:46,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +37: [2023-04-29 11:26:46,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +13: [2023-04-29 11:26:46,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +43: [2023-04-29 11:26:46,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +43: [2023-04-29 11:26:46,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +13: [2023-04-29 11:26:46,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +52: [2023-04-29 11:26:46,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +52: [2023-04-29 11:26:46,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +41: [2023-04-29 11:26:46,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +41: [2023-04-29 11:26:46,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +38: [2023-04-29 11:26:46,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +35: [2023-04-29 11:26:46,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +34: [2023-04-29 11:26:46,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +36: [2023-04-29 11:26:46,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +60: [2023-04-29 11:26:46,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +60: [2023-04-29 11:26:46,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +35: [2023-04-29 11:26:46,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +35: [2023-04-29 11:26:46,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +44: [2023-04-29 11:26:46,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 3: [2023-04-29 11:26:46,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 3: [2023-04-29 11:26:46,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 3: [2023-04-29 11:26:46,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +13: [2023-04-29 11:26:46,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +36: [2023-04-29 11:26:46,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +36: [2023-04-29 11:26:46,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +41: [2023-04-29 11:26:46,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +41: [2023-04-29 11:26:46,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +37: [2023-04-29 11:26:46,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +35: [2023-04-29 11:26:46,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +10: [2023-04-29 11:26:46,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +36: [2023-04-29 11:26:46,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +19: [2023-04-29 11:26:46,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +19: [2023-04-29 11:26:46,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +19: [2023-04-29 11:26:46,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +41: [2023-04-29 11:26:46,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +41: [2023-04-29 11:26:46,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +19: [2023-04-29 11:26:46,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +34: [2023-04-29 11:26:46,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +38: [2023-04-29 11:26:46,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... + 1: [2023-04-29 11:26:46,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +47: [2023-04-29 11:26:46,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +47: [2023-04-29 11:26:46,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +10: [2023-04-29 11:26:46,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +41: [2023-04-29 11:26:46,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +36: [2023-04-29 11:26:46,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +36: [2023-04-29 11:26:46,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +11: [2023-04-29 11:26:46,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +43: [2023-04-29 11:26:46,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +59: [2023-04-29 11:26:46,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +11: [2023-04-29 11:26:46,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +34: [2023-04-29 11:26:46,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +11: [2023-04-29 11:26:46,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 9: [2023-04-29 11:26:46,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +39: [2023-04-29 11:26:46,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +11: [2023-04-29 11:26:46,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +41: [2023-04-29 11:26:46,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +47: [2023-04-29 11:26:46,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +22: [2023-04-29 11:26:46,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +22: [2023-04-29 11:26:46,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +47: [2023-04-29 11:26:46,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +31: [2023-04-29 11:26:46,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +31: [2023-04-29 11:26:46,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +31: [2023-04-29 11:26:46,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +31: [2023-04-29 11:26:46,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +22: [2023-04-29 11:26:46,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 9: [2023-04-29 11:26:46,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +22: [2023-04-29 11:26:46,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 2: [2023-04-29 11:26:46,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +38: [2023-04-29 11:26:46,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +59: [2023-04-29 11:26:46,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +59: [2023-04-29 11:26:46,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +59: [2023-04-29 11:26:46,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 9: [2023-04-29 11:26:46,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +59: [2023-04-29 11:26:46,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +54: [2023-04-29 11:26:46,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +46: [2023-04-29 11:26:46,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 7: [2023-04-29 11:26:46,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +19: [2023-04-29 11:26:46,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 7: [2023-04-29 11:26:46,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +42: [2023-04-29 11:26:46,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +59: [2023-04-29 11:26:46,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +39: [2023-04-29 11:26:46,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +46: [2023-04-29 11:26:46,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +19: [2023-04-29 11:26:46,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +28: [2023-04-29 11:26:46,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +24: [2023-04-29 11:26:46,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +24: [2023-04-29 11:26:46,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +24: [2023-04-29 11:26:46,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +37: [2023-04-29 11:26:46,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +37: [2023-04-29 11:26:46,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +37: [2023-04-29 11:26:46,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +37: [2023-04-29 11:26:46,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +24: [2023-04-29 11:26:46,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +10: [2023-04-29 11:26:46,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +28: [2023-04-29 11:26:46,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +26: [2023-04-29 11:26:46,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +46: [2023-04-29 11:26:46,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +28: [2023-04-29 11:26:46,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +28: [2023-04-29 11:26:46,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +46: [2023-04-29 11:26:46,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +19: [2023-04-29 11:26:46,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +19: [2023-04-29 11:26:46,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +42: [2023-04-29 11:26:46,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +54: [2023-04-29 11:26:46,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +39: [2023-04-29 11:26:46,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 11:26:46,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +39: [2023-04-29 11:26:46,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +38: [2023-04-29 11:26:46,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +54: [2023-04-29 11:26:46,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +54: [2023-04-29 11:26:46,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +34: [2023-04-29 11:26:46,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +10: [2023-04-29 11:26:46,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +59: [2023-04-29 11:26:46,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +59: [2023-04-29 11:26:46,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +44: [2023-04-29 11:26:46,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +37: [2023-04-29 11:26:46,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 0: [2023-04-29 11:26:46,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 0: [2023-04-29 11:26:46,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +60: [2023-04-29 11:26:46,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +26: [2023-04-29 11:26:46,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +60: [2023-04-29 11:26:46,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +21: [2023-04-29 11:26:46,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +21: [2023-04-29 11:26:46,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +37: [2023-04-29 11:26:46,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 0: [2023-04-29 11:26:46,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 0: [2023-04-29 11:26:46,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +26: [2023-04-29 11:26:46,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +21: [2023-04-29 11:26:46,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +37: [2023-04-29 11:26:46,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +38: [2023-04-29 11:26:46,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +21: [2023-04-29 11:26:46,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +44: [2023-04-29 11:26:46,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +44: [2023-04-29 11:26:46,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +37: [2023-04-29 11:26:46,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +37: [2023-04-29 11:26:46,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +27: [2023-04-29 11:26:46,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +27: [2023-04-29 11:26:46,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 3: [2023-04-29 11:26:46,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +27: [2023-04-29 11:26:46,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +27: [2023-04-29 11:26:46,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +44: [2023-04-29 11:26:46,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +49: [2023-04-29 11:26:46,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +62: [2023-04-29 11:26:46,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +59: [2023-04-29 11:26:46,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +17: [2023-04-29 11:26:46,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +60: [2023-04-29 11:26:46,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +51: [2023-04-29 11:26:46,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +59: [2023-04-29 11:26:46,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +44: [2023-04-29 11:26:46,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +42: [2023-04-29 11:26:46,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +26: [2023-04-29 11:26:46,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... + 0: [2023-04-29 11:26:46,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +56: [2023-04-29 11:26:46,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 0: [2023-04-29 11:26:46,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +60: [2023-04-29 11:26:46,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +26: [2023-04-29 11:26:46,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +55: [2023-04-29 11:26:46,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +44: [2023-04-29 11:26:46,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +57: [2023-04-29 11:26:46,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +56: [2023-04-29 11:26:46,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +60: [2023-04-29 11:26:46,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +60: [2023-04-29 11:26:46,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +60: [2023-04-29 11:26:46,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +42: [2023-04-29 11:26:46,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +60: [2023-04-29 11:26:46,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +11: [2023-04-29 11:26:46,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +17: [2023-04-29 11:26:46,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +17: [2023-04-29 11:26:46,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +47: [2023-04-29 11:26:46,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +37: [2023-04-29 11:26:46,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +47: [2023-04-29 11:26:46,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +57: [2023-04-29 11:26:46,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +57: [2023-04-29 11:26:46,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +17: [2023-04-29 11:26:46,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +17: [2023-04-29 11:26:46,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +51: [2023-04-29 11:26:46,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +38: [2023-04-29 11:26:46,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +56: [2023-04-29 11:26:46,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +22: [2023-04-29 11:26:46,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +49: [2023-04-29 11:26:46,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +49: [2023-04-29 11:26:46,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +62: [2023-04-29 11:26:46,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +62: [2023-04-29 11:26:46,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 11:26:46,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +26: [2023-04-29 11:26:46,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +63: [2023-04-29 11:26:46,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +62: [2023-04-29 11:26:46,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +49: [2023-04-29 11:26:46,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +26: [2023-04-29 11:26:46,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +10: [2023-04-29 11:26:46,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +54: [2023-04-29 11:26:46,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +22: [2023-04-29 11:26:46,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +47: [2023-04-29 11:26:46,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +60: [2023-04-29 11:26:46,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +55: [2023-04-29 11:26:46,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +46: [2023-04-29 11:26:46,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +46: [2023-04-29 11:26:46,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +46: [2023-04-29 11:26:46,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +31: [2023-04-29 11:26:46,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +57: [2023-04-29 11:26:46,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +17: [2023-04-29 11:26:46,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +60: [2023-04-29 11:26:46,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +30: [2023-04-29 11:26:46,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +54: [2023-04-29 11:26:46,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +54: [2023-04-29 11:26:46,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +38: [2023-04-29 11:26:46,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +57: [2023-04-29 11:26:46,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +57: [2023-04-29 11:26:46,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +57: [2023-04-29 11:26:46,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +31: [2023-04-29 11:26:46,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +24: [2023-04-29 11:26:46,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +60: [2023-04-29 11:26:46,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +19: [2023-04-29 11:26:46,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +57: [2023-04-29 11:26:46,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +17: [2023-04-29 11:26:46,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +51: [2023-04-29 11:26:46,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 11:26:46,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +17: [2023-04-29 11:26:46,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +60: [2023-04-29 11:26:46,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +47: [2023-04-29 11:26:46,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +22: [2023-04-29 11:26:46,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +26: [2023-04-29 11:26:46,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +19: [2023-04-29 11:26:46,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +11: [2023-04-29 11:26:46,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +10: [2023-04-29 11:26:46,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +22: [2023-04-29 11:26:46,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +24: [2023-04-29 11:26:46,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +31: [2023-04-29 11:26:46,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +59: [2023-04-29 11:26:46,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +31: [2023-04-29 11:26:46,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +34: [2023-04-29 11:26:46,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +63: [2023-04-29 11:26:46,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 11:26:46,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +59: [2023-04-29 11:26:46,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +34: [2023-04-29 11:26:46,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +24: [2023-04-29 11:26:46,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +24: [2023-04-29 11:26:46,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +42: [2023-04-29 11:26:46,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +42: [2023-04-29 11:26:46,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +11: [2023-04-29 11:26:46,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 11:26:46,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +11: [2023-04-29 11:26:46,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +39: [2023-04-29 11:26:46,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +39: [2023-04-29 11:26:46,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +39: [2023-04-29 11:26:46,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +39: [2023-04-29 11:26:46,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +51: [2023-04-29 11:26:46,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +55: [2023-04-29 11:26:46,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 5: [2023-04-29 11:26:46,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 5: [2023-04-29 11:26:46,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. + 5: [2023-04-29 11:26:46,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +25: [2023-04-29 11:26:46,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +25: [2023-04-29 11:26:46,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +37: [2023-04-29 11:26:46,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +47: [2023-04-29 11:26:46,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +25: [2023-04-29 11:26:46,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +25: [2023-04-29 11:26:46,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +62: [2023-04-29 11:26:46,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +38: [2023-04-29 11:26:46,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +38: [2023-04-29 11:26:46,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +38: [2023-04-29 11:26:46,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +62: [2023-04-29 11:26:46,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +37: [2023-04-29 11:26:46,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +16: [2023-04-29 11:26:46,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +52: [2023-04-29 11:26:46,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +59: [2023-04-29 11:26:46,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +19: [2023-04-29 11:26:46,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +19: [2023-04-29 11:26:46,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +49: [2023-04-29 11:26:46,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +21: [2023-04-29 11:26:46,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +59: [2023-04-29 11:26:46,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +59: [2023-04-29 11:26:46,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +55: [2023-04-29 11:26:46,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +62: [2023-04-29 11:26:46,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +30: [2023-04-29 11:26:46,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +51: [2023-04-29 11:26:46,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +38: [2023-04-29 11:26:46,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +59: [2023-04-29 11:26:46,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +38: [2023-04-29 11:26:46,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +47: [2023-04-29 11:26:46,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +62: [2023-04-29 11:26:46,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +55: [2023-04-29 11:26:46,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +52: [2023-04-29 11:26:46,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +27: [2023-04-29 11:26:46,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +35: [2023-04-29 11:26:46,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +10: [2023-04-29 11:26:46,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +10: [2023-04-29 11:26:46,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +10: [2023-04-29 11:26:46,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +27: [2023-04-29 11:26:46,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +62: [2023-04-29 11:26:46,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +10: [2023-04-29 11:26:46,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +54: [2023-04-29 11:26:46,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +27: [2023-04-29 11:26:46,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +27: [2023-04-29 11:26:46,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +21: [2023-04-29 11:26:46,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +21: [2023-04-29 11:26:46,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +21: [2023-04-29 11:26:46,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +46: [2023-04-29 11:26:46,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +62: [2023-04-29 11:26:46,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +56: [2023-04-29 11:26:46,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +62: [2023-04-29 11:26:46,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +30: [2023-04-29 11:26:46,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +63: [2023-04-29 11:26:46,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +42: [2023-04-29 11:26:46,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +56: [2023-04-29 11:26:46,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +56: [2023-04-29 11:26:46,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +16: [2023-04-29 11:26:46,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +42: [2023-04-29 11:26:46,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +42: [2023-04-29 11:26:46,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +42: [2023-04-29 11:26:46,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +62: [2023-04-29 11:26:46,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +57: [2023-04-29 11:26:46,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +16: [2023-04-29 11:26:46,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +62: [2023-04-29 11:26:46,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 11:26:46,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +62: [2023-04-29 11:26:46,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +57: [2023-04-29 11:26:46,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +51: [2023-04-29 11:26:46,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +62: [2023-04-29 11:26:46,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +62: [2023-04-29 11:26:46,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +55: [2023-04-29 11:26:46,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +52: [2023-04-29 11:26:46,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +42: [2023-04-29 11:26:46,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +46: [2023-04-29 11:26:46,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +54: [2023-04-29 11:26:46,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +42: [2023-04-29 11:26:46,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +46: [2023-04-29 11:26:46,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +58: [2023-04-29 11:26:46,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +58: [2023-04-29 11:26:46,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +30: [2023-04-29 11:26:46,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +58: [2023-04-29 11:26:46,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +58: [2023-04-29 11:26:46,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +57: [2023-04-29 11:26:46,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +47: [2023-04-29 11:26:46,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +13: [2023-04-29 11:26:46,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +54: [2023-04-29 11:26:46,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +52: [2023-04-29 11:26:46,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +52: [2023-04-29 11:26:46,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +19: [2023-04-29 11:26:46,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +55: [2023-04-29 11:26:46,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +49: [2023-04-29 11:26:46,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +52: [2023-04-29 11:26:46,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +52: [2023-04-29 11:26:46,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +49: [2023-04-29 11:26:46,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +51: [2023-04-29 11:26:46,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +63: [2023-04-29 11:26:46,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +63: [2023-04-29 11:26:46,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +57: [2023-04-29 11:26:46,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +57: [2023-04-29 11:26:46,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +54: [2023-04-29 11:26:46,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +13: [2023-04-29 11:26:46,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +55: [2023-04-29 11:26:46,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +57: [2023-04-29 11:26:46,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +19: [2023-04-29 11:26:46,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +46: [2023-04-29 11:26:46,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +49: [2023-04-29 11:26:46,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 11:26:46,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +41: [2023-04-29 11:26:46,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +57: [2023-04-29 11:26:46,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +19: [2023-04-29 11:26:46,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +57: [2023-04-29 11:26:46,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +16: [2023-04-29 11:26:46,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +52: [2023-04-29 11:26:46,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +16: [2023-04-29 11:26:46,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +63: [2023-04-29 11:26:46,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 11:26:46,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +35: [2023-04-29 11:26:46,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +35: [2023-04-29 11:26:46,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +13: [2023-04-29 11:26:46,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +41: [2023-04-29 11:26:46,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +30: [2023-04-29 11:26:46,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +25: [2023-04-29 11:26:46,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +39: [2023-04-29 11:26:46,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +39: [2023-04-29 11:26:46,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +55: [2023-04-29 11:26:46,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +47: [2023-04-29 11:26:46,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +25: [2023-04-29 11:26:46,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +25: [2023-04-29 11:26:46,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +19: [2023-04-29 11:26:46,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +13: [2023-04-29 11:26:46,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +35: [2023-04-29 11:26:46,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +55: [2023-04-29 11:26:46,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +39: [2023-04-29 11:26:46,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +39: [2023-04-29 11:26:46,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +25: [2023-04-29 11:26:46,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +47: [2023-04-29 11:26:46,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +28: [2023-04-29 11:26:46,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +41: [2023-04-29 11:26:46,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +51: [2023-04-29 11:26:46,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +15: [2023-04-29 11:26:46,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +15: [2023-04-29 11:26:46,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +15: [2023-04-29 11:26:46,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +15: [2023-04-29 11:26:46,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 5: [2023-04-29 11:26:46,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +54: [2023-04-29 11:26:46,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +44: [2023-04-29 11:26:46,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +13: [2023-04-29 11:26:46,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +35: [2023-04-29 11:26:46,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 5: [2023-04-29 11:26:46,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +46: [2023-04-29 11:26:46,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +13: [2023-04-29 11:26:46,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +47: [2023-04-29 11:26:46,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +38: [2023-04-29 11:26:46,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +52: [2023-04-29 11:26:46,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +13: [2023-04-29 11:26:46,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +55: [2023-04-29 11:26:46,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +15: [2023-04-29 11:26:46,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +15: [2023-04-29 11:26:46,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +15: [2023-04-29 11:26:46,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +38: [2023-04-29 11:26:46,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +52: [2023-04-29 11:26:46,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +30: [2023-04-29 11:26:46,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +15: [2023-04-29 11:26:46,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +46: [2023-04-29 11:26:46,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +38: [2023-04-29 11:26:46,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +54: [2023-04-29 11:26:46,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +28: [2023-04-29 11:26:46,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +54: [2023-04-29 11:26:46,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +38: [2023-04-29 11:26:46,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +18: [2023-04-29 11:26:46,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +18: [2023-04-29 11:26:46,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +12: [2023-04-29 11:26:46,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +12: [2023-04-29 11:26:46,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +28: [2023-04-29 11:26:46,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 11:26:46,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +12: [2023-04-29 11:26:46,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +12: [2023-04-29 11:26:46,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +13: [2023-04-29 11:26:46,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +18: [2023-04-29 11:26:46,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +19: [2023-04-29 11:26:46,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +19: [2023-04-29 11:26:46,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +28: [2023-04-29 11:26:46,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +16: [2023-04-29 11:26:46,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +55: [2023-04-29 11:26:46,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +30: [2023-04-29 11:26:46,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +16: [2023-04-29 11:26:46,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +10: [2023-04-29 11:26:46,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 2: [2023-04-29 11:26:46,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +60: [2023-04-29 11:26:46,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +60: [2023-04-29 11:26:46,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +46: [2023-04-29 11:26:46,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +42: [2023-04-29 11:26:46,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +12: [2023-04-29 11:26:46,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +12: [2023-04-29 11:26:46,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +18: [2023-04-29 11:26:46,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +18: [2023-04-29 11:26:46,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +28: [2023-04-29 11:26:46,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +18: [2023-04-29 11:26:46,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +12: [2023-04-29 11:26:46,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +18: [2023-04-29 11:26:46,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +42: [2023-04-29 11:26:46,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +28: [2023-04-29 11:26:46,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +46: [2023-04-29 11:26:46,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 0: [2023-04-29 11:26:46,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +12: [2023-04-29 11:26:46,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +19: [2023-04-29 11:26:46,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +55: [2023-04-29 11:26:46,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +42: [2023-04-29 11:26:46,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +19: [2023-04-29 11:26:46,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +52: [2023-04-29 11:26:46,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 4: [2023-04-29 11:26:46,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... + 3: [2023-04-29 11:26:46,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +44: [2023-04-29 11:26:46,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +44: [2023-04-29 11:26:46,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +42: [2023-04-29 11:26:46,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +60: [2023-04-29 11:26:46,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +60: [2023-04-29 11:26:46,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +28: [2023-04-29 11:26:46,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +22: [2023-04-29 11:26:46,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +58: [2023-04-29 11:26:46,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +60: [2023-04-29 11:26:46,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 4: [2023-04-29 11:26:46,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +58: [2023-04-29 11:26:46,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... + 2: [2023-04-29 11:26:46,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +58: [2023-04-29 11:26:46,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +10: [2023-04-29 11:26:46,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 2: [2023-04-29 11:26:46,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +10: [2023-04-29 11:26:46,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +10: [2023-04-29 11:26:46,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +54: [2023-04-29 11:26:46,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +44: [2023-04-29 11:26:46,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +58: [2023-04-29 11:26:46,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +46: [2023-04-29 11:26:46,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +28: [2023-04-29 11:26:46,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +55: [2023-04-29 11:26:46,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... + 3: [2023-04-29 11:26:46,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +47: [2023-04-29 11:26:46,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +44: [2023-04-29 11:26:46,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +11: [2023-04-29 11:26:46,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +52: [2023-04-29 11:26:46,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +44: [2023-04-29 11:26:46,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +52: [2023-04-29 11:26:46,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +22: [2023-04-29 11:26:46,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +55: [2023-04-29 11:26:46,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +52: [2023-04-29 11:26:46,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +52: [2023-04-29 11:26:46,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +31: [2023-04-29 11:26:46,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +41: [2023-04-29 11:26:46,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 0: [2023-04-29 11:26:46,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +60: [2023-04-29 11:26:46,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +27: [2023-04-29 11:26:46,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +27: [2023-04-29 11:26:46,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +27: [2023-04-29 11:26:46,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +29: [2023-04-29 11:26:46,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +29: [2023-04-29 11:26:46,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +29: [2023-04-29 11:26:46,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +27: [2023-04-29 11:26:46,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +16: [2023-04-29 11:26:46,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +29: [2023-04-29 11:26:46,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +54: [2023-04-29 11:26:46,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... + 1: [2023-04-29 11:26:46,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 1: [2023-04-29 11:26:46,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +54: [2023-04-29 11:26:46,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +54: [2023-04-29 11:26:46,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +52: [2023-04-29 11:26:46,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +46: [2023-04-29 11:26:46,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +46: [2023-04-29 11:26:46,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +60: [2023-04-29 11:26:46,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +44: [2023-04-29 11:26:46,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +47: [2023-04-29 11:26:46,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +41: [2023-04-29 11:26:46,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +35: [2023-04-29 11:26:46,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 11:26:46,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 11:26:46,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 3: [2023-04-29 11:26:46,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 6: [2023-04-29 11:26:46,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +29: [2023-04-29 11:26:46,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +31: [2023-04-29 11:26:46,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +29: [2023-04-29 11:26:46,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 6: [2023-04-29 11:26:46,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +11: [2023-04-29 11:26:46,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +29: [2023-04-29 11:26:46,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +47: [2023-04-29 11:26:46,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +29: [2023-04-29 11:26:46,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +35: [2023-04-29 11:26:46,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +27: [2023-04-29 11:26:46,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 11:26:46,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 11:26:46,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +47: [2023-04-29 11:26:46,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +55: [2023-04-29 11:26:46,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +27: [2023-04-29 11:26:46,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 1: [2023-04-29 11:26:46,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +54: [2023-04-29 11:26:46,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... + 1: [2023-04-29 11:26:46,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +22: [2023-04-29 11:26:46,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +22: [2023-04-29 11:26:46,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +54: [2023-04-29 11:26:46,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... + 1: [2023-04-29 11:26:46,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +35: [2023-04-29 11:26:46,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +31: [2023-04-29 11:26:46,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +31: [2023-04-29 11:26:46,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +31: [2023-04-29 11:26:46,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +46: [2023-04-29 11:26:46,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +46: [2023-04-29 11:26:46,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +60: [2023-04-29 11:26:46,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +47: [2023-04-29 11:26:46,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +50: [2023-04-29 11:26:46,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +50: [2023-04-29 11:26:46,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +12: [2023-04-29 11:26:46,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +47: [2023-04-29 11:26:46,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 3: [2023-04-29 11:26:46,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +47: [2023-04-29 11:26:46,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +12: [2023-04-29 11:26:46,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +12: [2023-04-29 11:26:46,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +12: [2023-04-29 11:26:46,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +50: [2023-04-29 11:26:46,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +50: [2023-04-29 11:26:46,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. + 0: [2023-04-29 11:26:46,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +22: [2023-04-29 11:26:46,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +22: [2023-04-29 11:26:46,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +21: [2023-04-29 11:26:46,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +11: [2023-04-29 11:26:46,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +31: [2023-04-29 11:26:46,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +60: [2023-04-29 11:26:46,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +31: [2023-04-29 11:26:46,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +47: [2023-04-29 11:26:46,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +31: [2023-04-29 11:26:46,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +35: [2023-04-29 11:26:46,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +35: [2023-04-29 11:26:46,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +35: [2023-04-29 11:26:46,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +35: [2023-04-29 11:26:46,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +60: [2023-04-29 11:26:46,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +60: [2023-04-29 11:26:46,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +33: [2023-04-29 11:26:46,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +33: [2023-04-29 11:26:46,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +33: [2023-04-29 11:26:46,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +33: [2023-04-29 11:26:46,976] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 11:26:46,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +45: [2023-04-29 11:26:46,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +22: [2023-04-29 11:26:46,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +45: [2023-04-29 11:26:46,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +45: [2023-04-29 11:26:46,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +25: [2023-04-29 11:26:46,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +25: [2023-04-29 11:26:46,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +60: [2023-04-29 11:26:46,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +21: [2023-04-29 11:26:46,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... + 9: [2023-04-29 11:26:46,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +11: [2023-04-29 11:26:46,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +27: [2023-04-29 11:26:46,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +25: [2023-04-29 11:26:46,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +25: [2023-04-29 11:26:46,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +33: [2023-04-29 11:26:46,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +33: [2023-04-29 11:26:46,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 9: [2023-04-29 11:26:46,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... + 0: [2023-04-29 11:26:46,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 9: [2023-04-29 11:26:46,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +11: [2023-04-29 11:26:46,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +27: [2023-04-29 11:26:46,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 9: [2023-04-29 11:26:46,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 9: [2023-04-29 11:26:46,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +33: [2023-04-29 11:26:46,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +33: [2023-04-29 11:26:46,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 9: [2023-04-29 11:26:46,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... + 9: [2023-04-29 11:26:46,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... + 9: [2023-04-29 11:26:46,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +11: [2023-04-29 11:26:46,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +22: [2023-04-29 11:26:46,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +25: [2023-04-29 11:26:46,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +21: [2023-04-29 11:26:46,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +25: [2023-04-29 11:26:46,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +25: [2023-04-29 11:26:46,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +25: [2023-04-29 11:26:46,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +47: [2023-04-29 11:26:46,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +21: [2023-04-29 11:26:46,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +60: [2023-04-29 11:26:46,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +24: [2023-04-29 11:26:46,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +27: [2023-04-29 11:26:46,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 11:26:46,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +24: [2023-04-29 11:26:46,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +27: [2023-04-29 11:26:46,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +27: [2023-04-29 11:26:46,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +24: [2023-04-29 11:26:46,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +24: [2023-04-29 11:26:46,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +24: [2023-04-29 11:26:46,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +24: [2023-04-29 11:26:46,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +24: [2023-04-29 11:26:46,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +27: [2023-04-29 11:26:46,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +21: [2023-04-29 11:26:46,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +11: [2023-04-29 11:26:46,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... + 5: [2023-04-29 11:26:46,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +17: [2023-04-29 11:26:46,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +17: [2023-04-29 11:26:46,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +17: [2023-04-29 11:26:46,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 0: [2023-04-29 11:26:46,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 0: [2023-04-29 11:26:46,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +17: [2023-04-29 11:26:46,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +24: [2023-04-29 11:26:46,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +11: [2023-04-29 11:26:46,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +47: [2023-04-29 11:26:46,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +24: [2023-04-29 11:26:46,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +24: [2023-04-29 11:26:46,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 11:26:46,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +21: [2023-04-29 11:26:46,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +12: [2023-04-29 11:26:46,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 11:26:46,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +41: [2023-04-29 11:26:46,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +57: [2023-04-29 11:26:46,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +57: [2023-04-29 11:26:46,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +24: [2023-04-29 11:26:46,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +41: [2023-04-29 11:26:46,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +41: [2023-04-29 11:26:46,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +17: [2023-04-29 11:26:46,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +17: [2023-04-29 11:26:46,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +24: [2023-04-29 11:26:46,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +17: [2023-04-29 11:26:46,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +41: [2023-04-29 11:26:46,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. + 5: [2023-04-29 11:26:46,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +24: [2023-04-29 11:26:46,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +57: [2023-04-29 11:26:46,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +21: [2023-04-29 11:26:46,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +17: [2023-04-29 11:26:46,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +24: [2023-04-29 11:26:46,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +21: [2023-04-29 11:26:46,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +24: [2023-04-29 11:26:46,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +12: [2023-04-29 11:26:46,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +57: [2023-04-29 11:26:46,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +39: [2023-04-29 11:26:46,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +50: [2023-04-29 11:26:46,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +50: [2023-04-29 11:26:46,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +50: [2023-04-29 11:26:46,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +39: [2023-04-29 11:26:47,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +25: [2023-04-29 11:26:47,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +25: [2023-04-29 11:26:47,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +50: [2023-04-29 11:26:47,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 11:26:47,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +57: [2023-04-29 11:26:47,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +57: [2023-04-29 11:26:47,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +57: [2023-04-29 11:26:47,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +12: [2023-04-29 11:26:47,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +12: [2023-04-29 11:26:47,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +57: [2023-04-29 11:26:47,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +39: [2023-04-29 11:26:47,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +35: [2023-04-29 11:26:47,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +45: [2023-04-29 11:26:47,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +39: [2023-04-29 11:26:47,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +15: [2023-04-29 11:26:47,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +45: [2023-04-29 11:26:47,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +45: [2023-04-29 11:26:47,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 11:26:47,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +10: [2023-04-29 11:26:47,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +60: [2023-04-29 11:26:47,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +38: [2023-04-29 11:26:47,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +38: [2023-04-29 11:26:47,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +35: [2023-04-29 11:26:47,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +25: [2023-04-29 11:26:47,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +25: [2023-04-29 11:26:47,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +25: [2023-04-29 11:26:47,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +35: [2023-04-29 11:26:47,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +39: [2023-04-29 11:26:47,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +39: [2023-04-29 11:26:47,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +45: [2023-04-29 11:26:47,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 11:26:47,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +15: [2023-04-29 11:26:47,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +45: [2023-04-29 11:26:47,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +42: [2023-04-29 11:26:47,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +25: [2023-04-29 11:26:47,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +18: [2023-04-29 11:26:47,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +60: [2023-04-29 11:26:47,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +15: [2023-04-29 11:26:47,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +23: [2023-04-29 11:26:47,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +23: [2023-04-29 11:26:47,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +23: [2023-04-29 11:26:47,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +15: [2023-04-29 11:26:47,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +15: [2023-04-29 11:26:47,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +15: [2023-04-29 11:26:47,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +35: [2023-04-29 11:26:47,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +23: [2023-04-29 11:26:47,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +60: [2023-04-29 11:26:47,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +15: [2023-04-29 11:26:47,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +45: [2023-04-29 11:26:47,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +45: [2023-04-29 11:26:47,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +38: [2023-04-29 11:26:47,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +10: [2023-04-29 11:26:47,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +58: [2023-04-29 11:26:47,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +45: [2023-04-29 11:26:47,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +38: [2023-04-29 11:26:47,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +38: [2023-04-29 11:26:47,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +38: [2023-04-29 11:26:47,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +25: [2023-04-29 11:26:47,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... + 5: [2023-04-29 11:26:47,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +58: [2023-04-29 11:26:47,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +42: [2023-04-29 11:26:47,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +39: [2023-04-29 11:26:47,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +39: [2023-04-29 11:26:47,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +12: [2023-04-29 11:26:47,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +15: [2023-04-29 11:26:47,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +45: [2023-04-29 11:26:47,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +58: [2023-04-29 11:26:47,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +52: [2023-04-29 11:26:47,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +38: [2023-04-29 11:26:47,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +45: [2023-04-29 11:26:47,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 7: [2023-04-29 11:26:47,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +25: [2023-04-29 11:26:47,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +42: [2023-04-29 11:26:47,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 7: [2023-04-29 11:26:47,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +58: [2023-04-29 11:26:47,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... + 7: [2023-04-29 11:26:47,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +42: [2023-04-29 11:26:47,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +18: [2023-04-29 11:26:47,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +18: [2023-04-29 11:26:47,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +38: [2023-04-29 11:26:47,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +29: [2023-04-29 11:26:47,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +52: [2023-04-29 11:26:47,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +48: [2023-04-29 11:26:47,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +48: [2023-04-29 11:26:47,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +10: [2023-04-29 11:26:47,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +10: [2023-04-29 11:26:47,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +10: [2023-04-29 11:26:47,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +58: [2023-04-29 11:26:47,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +48: [2023-04-29 11:26:47,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +48: [2023-04-29 11:26:47,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +42: [2023-04-29 11:26:47,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +18: [2023-04-29 11:26:47,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +18: [2023-04-29 11:26:47,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +52: [2023-04-29 11:26:47,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +18: [2023-04-29 11:26:47,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +18: [2023-04-29 11:26:47,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +41: [2023-04-29 11:26:47,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +12: [2023-04-29 11:26:47,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +42: [2023-04-29 11:26:47,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +41: [2023-04-29 11:26:47,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +42: [2023-04-29 11:26:47,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +41: [2023-04-29 11:26:47,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +52: [2023-04-29 11:26:47,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +52: [2023-04-29 11:26:47,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +58: [2023-04-29 11:26:47,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +48: [2023-04-29 11:26:47,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +48: [2023-04-29 11:26:47,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +42: [2023-04-29 11:26:47,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +58: [2023-04-29 11:26:47,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +41: [2023-04-29 11:26:47,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +10: [2023-04-29 11:26:47,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +10: [2023-04-29 11:26:47,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +14: [2023-04-29 11:26:47,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +14: [2023-04-29 11:26:47,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +14: [2023-04-29 11:26:47,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +52: [2023-04-29 11:26:47,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +14: [2023-04-29 11:26:47,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 9: [2023-04-29 11:26:47,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +48: [2023-04-29 11:26:47,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +10: [2023-04-29 11:26:47,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +48: [2023-04-29 11:26:47,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +18: [2023-04-29 11:26:47,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +52: [2023-04-29 11:26:47,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +12: [2023-04-29 11:26:47,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +58: [2023-04-29 11:26:47,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +27: [2023-04-29 11:26:47,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +27: [2023-04-29 11:26:47,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +27: [2023-04-29 11:26:47,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +33: [2023-04-29 11:26:47,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +52: [2023-04-29 11:26:47,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +29: [2023-04-29 11:26:47,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +29: [2023-04-29 11:26:47,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +14: [2023-04-29 11:26:47,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 11:26:47,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +15: [2023-04-29 11:26:47,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 1: [2023-04-29 11:26:47,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +14: [2023-04-29 11:26:47,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +18: [2023-04-29 11:26:47,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +14: [2023-04-29 11:26:47,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +14: [2023-04-29 11:26:47,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +15: [2023-04-29 11:26:47,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +23: [2023-04-29 11:26:47,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +23: [2023-04-29 11:26:47,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +15: [2023-04-29 11:26:47,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +23: [2023-04-29 11:26:47,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +23: [2023-04-29 11:26:47,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +29: [2023-04-29 11:26:47,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +23: [2023-04-29 11:26:47,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +23: [2023-04-29 11:26:47,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +23: [2023-04-29 11:26:47,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +25: [2023-04-29 11:26:47,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +12: [2023-04-29 11:26:47,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +32: [2023-04-29 11:26:47,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +32: [2023-04-29 11:26:47,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +23: [2023-04-29 11:26:47,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +12: [2023-04-29 11:26:47,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 9: [2023-04-29 11:26:47,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 7: [2023-04-29 11:26:47,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +29: [2023-04-29 11:26:47,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +32: [2023-04-29 11:26:47,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +15: [2023-04-29 11:26:47,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +32: [2023-04-29 11:26:47,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. + 7: [2023-04-29 11:26:47,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +23: [2023-04-29 11:26:47,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +15: [2023-04-29 11:26:47,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +15: [2023-04-29 11:26:47,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +25: [2023-04-29 11:26:47,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +15: [2023-04-29 11:26:47,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +23: [2023-04-29 11:26:47,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +23: [2023-04-29 11:26:47,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +23: [2023-04-29 11:26:47,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +33: [2023-04-29 11:26:47,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +15: [2023-04-29 11:26:47,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 9: [2023-04-29 11:26:47,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 9: [2023-04-29 11:26:47,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +17: [2023-04-29 11:26:47,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +12: [2023-04-29 11:26:47,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +18: [2023-04-29 11:26:47,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +33: [2023-04-29 11:26:47,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +33: [2023-04-29 11:26:47,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +25: [2023-04-29 11:26:47,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +25: [2023-04-29 11:26:47,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +63: [2023-04-29 11:26:47,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +63: [2023-04-29 11:26:47,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +63: [2023-04-29 11:26:47,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. + 9: [2023-04-29 11:26:47,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +18: [2023-04-29 11:26:47,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +63: [2023-04-29 11:26:47,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +17: [2023-04-29 11:26:47,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +18: [2023-04-29 11:26:47,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +24: [2023-04-29 11:26:47,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +24: [2023-04-29 11:26:47,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +18: [2023-04-29 11:26:47,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +33: [2023-04-29 11:26:47,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +13: [2023-04-29 11:26:47,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +13: [2023-04-29 11:26:47,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +18: [2023-04-29 11:26:47,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +18: [2023-04-29 11:26:47,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +13: [2023-04-29 11:26:47,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +13: [2023-04-29 11:26:47,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +12: [2023-04-29 11:26:47,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +27: [2023-04-29 11:26:47,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +29: [2023-04-29 11:26:47,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +40: [2023-04-29 11:26:47,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +29: [2023-04-29 11:26:47,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +40: [2023-04-29 11:26:47,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +40: [2023-04-29 11:26:47,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +40: [2023-04-29 11:26:47,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +17: [2023-04-29 11:26:47,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +22: [2023-04-29 11:26:47,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +22: [2023-04-29 11:26:47,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +12: [2023-04-29 11:26:47,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +35: [2023-04-29 11:26:47,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +20: [2023-04-29 11:26:47,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +24: [2023-04-29 11:26:47,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +20: [2023-04-29 11:26:47,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +13: [2023-04-29 11:26:47,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +20: [2023-04-29 11:26:47,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +27: [2023-04-29 11:26:47,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +50: [2023-04-29 11:26:47,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +27: [2023-04-29 11:26:47,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 11:26:47,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_12-model_01-model_states.pt. +27: [2023-04-29 11:26:47,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +28: [2023-04-29 11:26:47,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +13: [2023-04-29 11:26:47,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +28: [2023-04-29 11:26:47,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +28: [2023-04-29 11:26:47,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +28: [2023-04-29 11:26:47,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +43: [2023-04-29 11:26:47,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +43: [2023-04-29 11:26:47,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. + 1: [2023-04-29 11:26:47,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +43: [2023-04-29 11:26:47,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +13: [2023-04-29 11:26:47,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +43: [2023-04-29 11:26:47,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. + 8: [2023-04-29 11:26:47,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 8: [2023-04-29 11:26:47,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +29: [2023-04-29 11:26:47,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +13: [2023-04-29 11:26:47,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 8: [2023-04-29 11:26:47,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +22: [2023-04-29 11:26:47,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +22: [2023-04-29 11:26:47,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +24: [2023-04-29 11:26:47,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 1: [2023-04-29 11:26:47,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 1: [2023-04-29 11:26:47,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +50: [2023-04-29 11:26:47,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +50: [2023-04-29 11:26:47,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 9: [2023-04-29 11:26:47,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 11:26:47,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +25: [2023-04-29 11:26:47,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +35: [2023-04-29 11:26:47,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +17: [2023-04-29 11:26:47,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +28: [2023-04-29 11:26:47,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +22: [2023-04-29 11:26:47,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +28: [2023-04-29 11:26:47,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +50: [2023-04-29 11:26:47,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +50: [2023-04-29 11:26:47,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +22: [2023-04-29 11:26:47,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +35: [2023-04-29 11:26:47,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +33: [2023-04-29 11:26:47,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +33: [2023-04-29 11:26:47,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +33: [2023-04-29 11:26:47,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +32: [2023-04-29 11:26:47,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +22: [2023-04-29 11:26:47,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +33: [2023-04-29 11:26:47,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +12: [2023-04-29 11:26:47,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +33: [2023-04-29 11:26:47,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +28: [2023-04-29 11:26:47,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +28: [2023-04-29 11:26:47,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +22: [2023-04-29 11:26:47,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +50: [2023-04-29 11:26:47,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +50: [2023-04-29 11:26:47,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +25: [2023-04-29 11:26:47,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +32: [2023-04-29 11:26:47,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +50: [2023-04-29 11:26:47,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +12: [2023-04-29 11:26:47,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +35: [2023-04-29 11:26:47,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... + 3: [2023-04-29 11:26:47,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +45: [2023-04-29 11:26:47,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +32: [2023-04-29 11:26:47,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +17: [2023-04-29 11:26:47,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +45: [2023-04-29 11:26:47,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 9: [2023-04-29 11:26:47,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +45: [2023-04-29 11:26:47,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 9: [2023-04-29 11:26:47,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +35: [2023-04-29 11:26:47,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +24: [2023-04-29 11:26:47,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +25: [2023-04-29 11:26:47,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +63: [2023-04-29 11:26:47,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +17: [2023-04-29 11:26:47,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 11:26:47,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... + 3: [2023-04-29 11:26:47,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +32: [2023-04-29 11:26:47,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +41: [2023-04-29 11:26:47,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +45: [2023-04-29 11:26:47,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +24: [2023-04-29 11:26:47,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +63: [2023-04-29 11:26:47,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +25: [2023-04-29 11:26:47,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +45: [2023-04-29 11:26:47,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... + 3: [2023-04-29 11:26:47,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +26: [2023-04-29 11:26:47,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +49: [2023-04-29 11:26:47,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +49: [2023-04-29 11:26:47,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +26: [2023-04-29 11:26:47,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +26: [2023-04-29 11:26:47,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +26: [2023-04-29 11:26:47,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +45: [2023-04-29 11:26:47,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +49: [2023-04-29 11:26:47,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +49: [2023-04-29 11:26:47,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +63: [2023-04-29 11:26:47,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +35: [2023-04-29 11:26:47,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +63: [2023-04-29 11:26:47,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +41: [2023-04-29 11:26:47,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +35: [2023-04-29 11:26:47,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +40: [2023-04-29 11:26:47,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +33: [2023-04-29 11:26:47,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +33: [2023-04-29 11:26:47,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +41: [2023-04-29 11:26:47,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +40: [2023-04-29 11:26:47,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 11:26:47,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +40: [2023-04-29 11:26:47,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +40: [2023-04-29 11:26:47,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +12: [2023-04-29 11:26:47,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +40: [2023-04-29 11:26:47,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +40: [2023-04-29 11:26:47,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 11:26:47,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +56: [2023-04-29 11:26:47,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +20: [2023-04-29 11:26:47,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +40: [2023-04-29 11:26:47,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +20: [2023-04-29 11:26:47,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +17: [2023-04-29 11:26:47,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +40: [2023-04-29 11:26:47,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 11:26:47,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +35: [2023-04-29 11:26:47,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +26: [2023-04-29 11:26:47,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +26: [2023-04-29 11:26:47,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +26: [2023-04-29 11:26:47,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +48: [2023-04-29 11:26:47,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +40: [2023-04-29 11:26:47,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +26: [2023-04-29 11:26:47,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +45: [2023-04-29 11:26:47,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +48: [2023-04-29 11:26:47,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +43: [2023-04-29 11:26:47,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 11:26:47,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +56: [2023-04-29 11:26:47,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +45: [2023-04-29 11:26:47,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 11:26:47,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +12: [2023-04-29 11:26:47,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +56: [2023-04-29 11:26:47,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_34-model_01-model_states.pt. +40: [2023-04-29 11:26:47,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +12: [2023-04-29 11:26:47,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +20: [2023-04-29 11:26:47,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +15: [2023-04-29 11:26:47,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +14: [2023-04-29 11:26:47,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +43: [2023-04-29 11:26:47,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +43: [2023-04-29 11:26:47,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +45: [2023-04-29 11:26:47,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +40: [2023-04-29 11:26:47,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +43: [2023-04-29 11:26:47,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +24: [2023-04-29 11:26:47,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +40: [2023-04-29 11:26:47,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 11:26:47,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +20: [2023-04-29 11:26:47,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt... +17: [2023-04-29 11:26:47,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +41: [2023-04-29 11:26:47,100] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +33: [2023-04-29 11:26:47,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +12: [2023-04-29 11:26:47,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +15: [2023-04-29 11:26:47,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +24: [2023-04-29 11:26:47,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +48: [2023-04-29 11:26:47,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +48: [2023-04-29 11:26:47,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 11:26:47,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +23: [2023-04-29 11:26:47,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +41: [2023-04-29 11:26:47,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +23: [2023-04-29 11:26:47,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +45: [2023-04-29 11:26:47,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +33: [2023-04-29 11:26:47,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +33: [2023-04-29 11:26:47,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +33: [2023-04-29 11:26:47,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +18: [2023-04-29 11:26:47,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +14: [2023-04-29 11:26:47,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +45: [2023-04-29 11:26:47,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +49: [2023-04-29 11:26:47,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +23: [2023-04-29 11:26:47,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +14: [2023-04-29 11:26:47,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +14: [2023-04-29 11:26:47,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +23: [2023-04-29 11:26:47,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +23: [2023-04-29 11:26:47,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +23: [2023-04-29 11:26:47,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... + 7: [2023-04-29 11:26:47,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +49: [2023-04-29 11:26:47,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +49: [2023-04-29 11:26:47,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +18: [2023-04-29 11:26:47,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... + 7: [2023-04-29 11:26:47,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +58: [2023-04-29 11:26:47,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +58: [2023-04-29 11:26:47,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +15: [2023-04-29 11:26:47,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +58: [2023-04-29 11:26:47,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +53: [2023-04-29 11:26:47,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +53: [2023-04-29 11:26:47,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +53: [2023-04-29 11:26:47,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +58: [2023-04-29 11:26:47,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +49: [2023-04-29 11:26:47,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +23: [2023-04-29 11:26:47,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +23: [2023-04-29 11:26:47,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... + 7: [2023-04-29 11:26:47,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +23: [2023-04-29 11:26:47,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +53: [2023-04-29 11:26:47,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +15: [2023-04-29 11:26:47,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +15: [2023-04-29 11:26:47,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +50: [2023-04-29 11:26:47,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +50: [2023-04-29 11:26:47,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +50: [2023-04-29 11:26:47,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 7: [2023-04-29 11:26:47,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +61: [2023-04-29 11:26:47,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 11:26:47,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 11:26:47,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +50: [2023-04-29 11:26:47,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 11:26:47,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 7: [2023-04-29 11:26:47,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +23: [2023-04-29 11:26:47,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +23: [2023-04-29 11:26:47,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +48: [2023-04-29 11:26:47,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +23: [2023-04-29 11:26:47,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +56: [2023-04-29 11:26:47,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +48: [2023-04-29 11:26:47,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 11:26:47,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +58: [2023-04-29 11:26:47,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +58: [2023-04-29 11:26:47,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +58: [2023-04-29 11:26:47,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +53: [2023-04-29 11:26:47,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +53: [2023-04-29 11:26:47,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +53: [2023-04-29 11:26:47,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +36: [2023-04-29 11:26:47,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +36: [2023-04-29 11:26:47,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +36: [2023-04-29 11:26:47,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +58: [2023-04-29 11:26:47,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +15: [2023-04-29 11:26:47,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +36: [2023-04-29 11:26:47,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 11:26:47,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +53: [2023-04-29 11:26:47,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +61: [2023-04-29 11:26:47,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +56: [2023-04-29 11:26:47,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +18: [2023-04-29 11:26:47,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +61: [2023-04-29 11:26:47,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +61: [2023-04-29 11:26:47,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +15: [2023-04-29 11:26:47,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +15: [2023-04-29 11:26:47,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... + 7: [2023-04-29 11:26:47,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +14: [2023-04-29 11:26:47,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 8: [2023-04-29 11:26:47,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +18: [2023-04-29 11:26:47,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +36: [2023-04-29 11:26:47,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +50: [2023-04-29 11:26:47,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +45: [2023-04-29 11:26:47,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +50: [2023-04-29 11:26:47,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +36: [2023-04-29 11:26:47,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +36: [2023-04-29 11:26:47,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +50: [2023-04-29 11:26:47,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +36: [2023-04-29 11:26:47,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +28: [2023-04-29 11:26:47,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +32: [2023-04-29 11:26:47,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +32: [2023-04-29 11:26:47,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +32: [2023-04-29 11:26:47,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +32: [2023-04-29 11:26:47,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +18: [2023-04-29 11:26:47,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +50: [2023-04-29 11:26:47,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +18: [2023-04-29 11:26:47,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +22: [2023-04-29 11:26:47,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +45: [2023-04-29 11:26:47,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +13: [2023-04-29 11:26:47,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +13: [2023-04-29 11:26:47,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +31: [2023-04-29 11:26:47,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +31: [2023-04-29 11:26:47,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +56: [2023-04-29 11:26:47,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt... +31: [2023-04-29 11:26:47,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +31: [2023-04-29 11:26:47,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +48: [2023-04-29 11:26:47,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +13: [2023-04-29 11:26:47,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +18: [2023-04-29 11:26:47,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +13: [2023-04-29 11:26:47,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +48: [2023-04-29 11:26:47,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +22: [2023-04-29 11:26:47,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +18: [2023-04-29 11:26:47,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +28: [2023-04-29 11:26:47,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +31: [2023-04-29 11:26:47,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +31: [2023-04-29 11:26:47,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +31: [2023-04-29 11:26:47,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +31: [2023-04-29 11:26:47,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +32: [2023-04-29 11:26:47,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +32: [2023-04-29 11:26:47,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +32: [2023-04-29 11:26:47,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +32: [2023-04-29 11:26:47,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +32: [2023-04-29 11:26:47,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +22: [2023-04-29 11:26:47,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +22: [2023-04-29 11:26:47,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +28: [2023-04-29 11:26:47,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +28: [2023-04-29 11:26:47,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +14: [2023-04-29 11:26:47,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +32: [2023-04-29 11:26:47,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +14: [2023-04-29 11:26:47,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +14: [2023-04-29 11:26:47,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +23: [2023-04-29 11:26:47,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +40: [2023-04-29 11:26:47,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 11:26:47,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +23: [2023-04-29 11:26:47,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +23: [2023-04-29 11:26:47,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +23: [2023-04-29 11:26:47,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +40: [2023-04-29 11:26:47,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... + 8: [2023-04-29 11:26:47,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 11:26:47,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +63: [2023-04-29 11:26:47,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +63: [2023-04-29 11:26:47,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +28: [2023-04-29 11:26:47,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +63: [2023-04-29 11:26:47,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +20: [2023-04-29 11:26:47,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +20: [2023-04-29 11:26:47,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +13: [2023-04-29 11:26:47,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +11: [2023-04-29 11:26:47,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +11: [2023-04-29 11:26:47,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +11: [2023-04-29 11:26:47,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +11: [2023-04-29 11:26:47,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +20: [2023-04-29 11:26:47,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +63: [2023-04-29 11:26:47,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +22: [2023-04-29 11:26:47,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +43: [2023-04-29 11:26:47,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +20: [2023-04-29 11:26:47,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +40: [2023-04-29 11:26:47,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +26: [2023-04-29 11:26:47,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +26: [2023-04-29 11:26:47,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +26: [2023-04-29 11:26:47,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +22: [2023-04-29 11:26:47,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 11:26:47,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +20: [2023-04-29 11:26:47,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +43: [2023-04-29 11:26:47,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 11:26:47,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +13: [2023-04-29 11:26:47,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +63: [2023-04-29 11:26:47,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +63: [2023-04-29 11:26:47,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +11: [2023-04-29 11:26:47,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +28: [2023-04-29 11:26:47,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +13: [2023-04-29 11:26:47,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +13: [2023-04-29 11:26:47,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +21: [2023-04-29 11:26:47,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +21: [2023-04-29 11:26:47,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +21: [2023-04-29 11:26:47,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +49: [2023-04-29 11:26:47,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +20: [2023-04-29 11:26:47,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +20: [2023-04-29 11:26:47,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +21: [2023-04-29 11:26:47,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +26: [2023-04-29 11:26:47,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +20: [2023-04-29 11:26:47,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +11: [2023-04-29 11:26:47,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +43: [2023-04-29 11:26:47,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +11: [2023-04-29 11:26:47,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 11:26:47,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +11: [2023-04-29 11:26:47,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +33: [2023-04-29 11:26:47,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +43: [2023-04-29 11:26:47,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +43: [2023-04-29 11:26:47,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +20: [2023-04-29 11:26:47,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +43: [2023-04-29 11:26:47,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... + 5: [2023-04-29 11:26:47,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +40: [2023-04-29 11:26:47,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +40: [2023-04-29 11:26:47,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +40: [2023-04-29 11:26:47,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +49: [2023-04-29 11:26:47,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +20: [2023-04-29 11:26:47,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. +21: [2023-04-29 11:26:47,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +21: [2023-04-29 11:26:47,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +21: [2023-04-29 11:26:47,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +21: [2023-04-29 11:26:47,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +40: [2023-04-29 11:26:47,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +43: [2023-04-29 11:26:47,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +43: [2023-04-29 11:26:47,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... + 2: [2023-04-29 11:26:47,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +20: [2023-04-29 11:26:47,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_00-model_states.pt. + 2: [2023-04-29 11:26:47,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 2: [2023-04-29 11:26:47,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +33: [2023-04-29 11:26:47,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... + 5: [2023-04-29 11:26:47,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 11:26:47,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +28: [2023-04-29 11:26:47,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +22: [2023-04-29 11:26:47,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +40: [2023-04-29 11:26:47,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 8: [2023-04-29 11:26:47,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 8: [2023-04-29 11:26:47,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +40: [2023-04-29 11:26:47,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +48: [2023-04-29 11:26:47,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +48: [2023-04-29 11:26:47,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +40: [2023-04-29 11:26:47,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +40: [2023-04-29 11:26:47,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +48: [2023-04-29 11:26:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +28: [2023-04-29 11:26:47,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +48: [2023-04-29 11:26:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. + 2: [2023-04-29 11:26:47,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +32: [2023-04-29 11:26:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +32: [2023-04-29 11:26:47,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +32: [2023-04-29 11:26:47,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +20: [2023-04-29 11:26:47,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +34: [2023-04-29 11:26:47,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +34: [2023-04-29 11:26:47,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. + 2: [2023-04-29 11:26:47,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +49: [2023-04-29 11:26:47,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 2: [2023-04-29 11:26:47,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 11:26:47,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt... +34: [2023-04-29 11:26:47,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +34: [2023-04-29 11:26:47,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +40: [2023-04-29 11:26:47,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +33: [2023-04-29 11:26:47,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +49: [2023-04-29 11:26:47,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +49: [2023-04-29 11:26:47,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +36: [2023-04-29 11:26:47,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +32: [2023-04-29 11:26:47,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +40: [2023-04-29 11:26:47,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +33: [2023-04-29 11:26:47,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +33: [2023-04-29 11:26:47,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +32: [2023-04-29 11:26:47,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +56: [2023-04-29 11:26:47,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +32: [2023-04-29 11:26:47,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +49: [2023-04-29 11:26:47,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +26: [2023-04-29 11:26:47,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +61: [2023-04-29 11:26:47,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 11:26:47,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +53: [2023-04-29 11:26:47,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +26: [2023-04-29 11:26:47,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +49: [2023-04-29 11:26:47,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +58: [2023-04-29 11:26:47,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +58: [2023-04-29 11:26:47,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +26: [2023-04-29 11:26:47,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +33: [2023-04-29 11:26:47,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +26: [2023-04-29 11:26:47,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +53: [2023-04-29 11:26:47,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +53: [2023-04-29 11:26:47,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 11:26:47,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 11:26:47,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +33: [2023-04-29 11:26:47,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +56: [2023-04-29 11:26:47,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +53: [2023-04-29 11:26:47,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +33: [2023-04-29 11:26:47,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +56: [2023-04-29 11:26:47,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +50: [2023-04-29 11:26:47,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +49: [2023-04-29 11:26:47,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... + 1: [2023-04-29 11:26:47,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 1: [2023-04-29 11:26:47,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +58: [2023-04-29 11:26:47,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 0: [2023-04-29 11:26:47,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 0: [2023-04-29 11:26:47,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 0: [2023-04-29 11:26:47,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 1: [2023-04-29 11:26:47,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 0: [2023-04-29 11:26:47,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 1: [2023-04-29 11:26:47,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +36: [2023-04-29 11:26:47,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +50: [2023-04-29 11:26:47,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 11:26:47,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +40: [2023-04-29 11:26:47,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +31: [2023-04-29 11:26:47,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +58: [2023-04-29 11:26:47,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +36: [2023-04-29 11:26:47,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +36: [2023-04-29 11:26:47,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 11:26:47,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +50: [2023-04-29 11:26:47,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +34: [2023-04-29 11:26:47,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +56: [2023-04-29 11:26:47,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +31: [2023-04-29 11:26:47,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +31: [2023-04-29 11:26:47,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +31: [2023-04-29 11:26:47,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +48: [2023-04-29 11:26:47,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +40: [2023-04-29 11:26:47,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +48: [2023-04-29 11:26:47,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +48: [2023-04-29 11:26:47,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +48: [2023-04-29 11:26:47,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +50: [2023-04-29 11:26:47,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 11:26:47,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_00-model_states.pt. +10: [2023-04-29 11:26:47,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +10: [2023-04-29 11:26:47,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +10: [2023-04-29 11:26:47,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +34: [2023-04-29 11:26:47,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +10: [2023-04-29 11:26:47,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +36: [2023-04-29 11:26:47,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 8: [2023-04-29 11:26:47,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 8: [2023-04-29 11:26:47,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 8: [2023-04-29 11:26:47,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 8: [2023-04-29 11:26:47,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +40: [2023-04-29 11:26:47,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +34: [2023-04-29 11:26:47,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +34: [2023-04-29 11:26:47,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +10: [2023-04-29 11:26:47,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +10: [2023-04-29 11:26:47,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +61: [2023-04-29 11:26:47,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +61: [2023-04-29 11:26:47,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 11:26:47,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt... +10: [2023-04-29 11:26:47,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +38: [2023-04-29 11:26:47,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +38: [2023-04-29 11:26:47,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +38: [2023-04-29 11:26:47,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 11:26:47,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +61: [2023-04-29 11:26:47,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +38: [2023-04-29 11:26:47,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +58: [2023-04-29 11:26:47,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +58: [2023-04-29 11:26:47,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +53: [2023-04-29 11:26:47,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +10: [2023-04-29 11:26:47,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +53: [2023-04-29 11:26:47,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +53: [2023-04-29 11:26:47,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +53: [2023-04-29 11:26:47,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +20: [2023-04-29 11:26:47,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +11: [2023-04-29 11:26:47,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 0: [2023-04-29 11:26:47,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 1: [2023-04-29 11:26:47,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +38: [2023-04-29 11:26:47,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +38: [2023-04-29 11:26:47,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +38: [2023-04-29 11:26:47,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +38: [2023-04-29 11:26:47,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 1: [2023-04-29 11:26:47,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +32: [2023-04-29 11:26:47,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +32: [2023-04-29 11:26:47,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +32: [2023-04-29 11:26:47,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 1: [2023-04-29 11:26:47,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +32: [2023-04-29 11:26:47,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +58: [2023-04-29 11:26:47,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +50: [2023-04-29 11:26:47,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +36: [2023-04-29 11:26:47,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +31: [2023-04-29 11:26:47,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +36: [2023-04-29 11:26:47,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +36: [2023-04-29 11:26:47,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +58: [2023-04-29 11:26:47,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +20: [2023-04-29 11:26:47,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +11: [2023-04-29 11:26:47,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +11: [2023-04-29 11:26:47,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +11: [2023-04-29 11:26:47,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +21: [2023-04-29 11:26:47,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +50: [2023-04-29 11:26:47,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +31: [2023-04-29 11:26:47,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +14: [2023-04-29 11:26:47,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +14: [2023-04-29 11:26:47,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +31: [2023-04-29 11:26:47,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +31: [2023-04-29 11:26:47,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 11:26:47,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +37: [2023-04-29 11:26:47,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +37: [2023-04-29 11:26:47,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +20: [2023-04-29 11:26:47,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +14: [2023-04-29 11:26:47,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +37: [2023-04-29 11:26:47,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +37: [2023-04-29 11:26:47,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +14: [2023-04-29 11:26:47,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +50: [2023-04-29 11:26:47,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 8: [2023-04-29 11:26:47,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 8: [2023-04-29 11:26:47,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 8: [2023-04-29 11:26:47,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +21: [2023-04-29 11:26:47,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +21: [2023-04-29 11:26:47,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +21: [2023-04-29 11:26:47,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +50: [2023-04-29 11:26:47,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +37: [2023-04-29 11:26:47,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +37: [2023-04-29 11:26:47,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 2: [2023-04-29 11:26:47,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +37: [2023-04-29 11:26:47,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +37: [2023-04-29 11:26:47,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +11: [2023-04-29 11:26:47,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +20: [2023-04-29 11:26:47,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +44: [2023-04-29 11:26:47,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +44: [2023-04-29 11:26:47,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +44: [2023-04-29 11:26:47,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +44: [2023-04-29 11:26:47,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 2: [2023-04-29 11:26:47,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 2: [2023-04-29 11:26:47,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +44: [2023-04-29 11:26:47,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +44: [2023-04-29 11:26:47,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +44: [2023-04-29 11:26:47,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +34: [2023-04-29 11:26:47,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +34: [2023-04-29 11:26:47,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +34: [2023-04-29 11:26:47,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +34: [2023-04-29 11:26:47,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +44: [2023-04-29 11:26:47,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +34: [2023-04-29 11:26:47,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +21: [2023-04-29 11:26:47,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +20: [2023-04-29 11:26:47,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +26: [2023-04-29 11:26:47,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +26: [2023-04-29 11:26:47,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +54: [2023-04-29 11:26:47,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +54: [2023-04-29 11:26:47,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +54: [2023-04-29 11:26:47,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. + 5: [2023-04-29 11:26:47,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +54: [2023-04-29 11:26:47,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +34: [2023-04-29 11:26:47,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +34: [2023-04-29 11:26:47,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +14: [2023-04-29 11:26:47,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +11: [2023-04-29 11:26:47,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +26: [2023-04-29 11:26:47,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +34: [2023-04-29 11:26:47,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +48: [2023-04-29 11:26:47,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +26: [2023-04-29 11:26:47,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +11: [2023-04-29 11:26:47,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +11: [2023-04-29 11:26:47,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +32: [2023-04-29 11:26:47,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +32: [2023-04-29 11:26:47,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +14: [2023-04-29 11:26:47,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +14: [2023-04-29 11:26:47,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +14: [2023-04-29 11:26:47,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +48: [2023-04-29 11:26:47,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +21: [2023-04-29 11:26:47,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +21: [2023-04-29 11:26:47,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +20: [2023-04-29 11:26:47,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 11:26:47,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +48: [2023-04-29 11:26:47,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +21: [2023-04-29 11:26:47,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +32: [2023-04-29 11:26:47,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +32: [2023-04-29 11:26:47,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +48: [2023-04-29 11:26:47,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +48: [2023-04-29 11:26:47,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +63: [2023-04-29 11:26:47,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +63: [2023-04-29 11:26:47,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +63: [2023-04-29 11:26:47,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +63: [2023-04-29 11:26:47,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +61: [2023-04-29 11:26:47,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +61: [2023-04-29 11:26:47,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +61: [2023-04-29 11:26:47,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +59: [2023-04-29 11:26:47,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +59: [2023-04-29 11:26:47,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +59: [2023-04-29 11:26:47,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 11:26:47,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +59: [2023-04-29 11:26:47,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +10: [2023-04-29 11:26:47,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +34: [2023-04-29 11:26:47,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 11:26:47,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +48: [2023-04-29 11:26:47,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +63: [2023-04-29 11:26:47,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +63: [2023-04-29 11:26:47,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 1: [2023-04-29 11:26:47,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 2: [2023-04-29 11:26:47,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +10: [2023-04-29 11:26:47,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +63: [2023-04-29 11:26:47,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +57: [2023-04-29 11:26:47,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +57: [2023-04-29 11:26:47,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +48: [2023-04-29 11:26:47,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +57: [2023-04-29 11:26:47,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +34: [2023-04-29 11:26:47,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +59: [2023-04-29 11:26:47,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +34: [2023-04-29 11:26:47,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... + 1: [2023-04-29 11:26:47,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +57: [2023-04-29 11:26:47,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +59: [2023-04-29 11:26:47,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +59: [2023-04-29 11:26:47,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +57: [2023-04-29 11:26:47,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +57: [2023-04-29 11:26:47,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +10: [2023-04-29 11:26:47,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +48: [2023-04-29 11:26:47,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +38: [2023-04-29 11:26:47,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +59: [2023-04-29 11:26:47,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +34: [2023-04-29 11:26:47,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +54: [2023-04-29 11:26:47,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +54: [2023-04-29 11:26:47,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +54: [2023-04-29 11:26:47,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +54: [2023-04-29 11:26:47,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +26: [2023-04-29 11:26:47,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +57: [2023-04-29 11:26:47,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 1: [2023-04-29 11:26:47,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +57: [2023-04-29 11:26:47,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +10: [2023-04-29 11:26:47,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +26: [2023-04-29 11:26:47,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +38: [2023-04-29 11:26:47,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +26: [2023-04-29 11:26:47,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +55: [2023-04-29 11:26:47,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 11:26:47,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 11:26:47,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 9: [2023-04-29 11:26:47,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 9: [2023-04-29 11:26:47,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +55: [2023-04-29 11:26:47,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +34: [2023-04-29 11:26:47,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 0: [2023-04-29 11:26:47,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +38: [2023-04-29 11:26:47,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +38: [2023-04-29 11:26:47,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 9: [2023-04-29 11:26:47,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +59: [2023-04-29 11:26:47,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +59: [2023-04-29 11:26:47,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. + 9: [2023-04-29 11:26:47,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 1: [2023-04-29 11:26:47,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +55: [2023-04-29 11:26:47,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +34: [2023-04-29 11:26:47,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +49: [2023-04-29 11:26:47,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +49: [2023-04-29 11:26:47,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +26: [2023-04-29 11:26:47,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +53: [2023-04-29 11:26:47,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +53: [2023-04-29 11:26:47,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +53: [2023-04-29 11:26:47,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +53: [2023-04-29 11:26:47,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +55: [2023-04-29 11:26:47,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +55: [2023-04-29 11:26:47,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +59: [2023-04-29 11:26:47,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. + 0: [2023-04-29 11:26:47,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +55: [2023-04-29 11:26:47,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 7: [2023-04-29 11:26:47,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +61: [2023-04-29 11:26:47,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +10: [2023-04-29 11:26:47,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +49: [2023-04-29 11:26:47,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +59: [2023-04-29 11:26:47,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +49: [2023-04-29 11:26:47,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 0: [2023-04-29 11:26:47,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 0: [2023-04-29 11:26:47,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +10: [2023-04-29 11:26:47,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 7: [2023-04-29 11:26:47,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +61: [2023-04-29 11:26:47,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +34: [2023-04-29 11:26:47,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +61: [2023-04-29 11:26:47,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +61: [2023-04-29 11:26:47,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +49: [2023-04-29 11:26:47,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +49: [2023-04-29 11:26:47,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +49: [2023-04-29 11:26:47,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +44: [2023-04-29 11:26:47,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 0: [2023-04-29 11:26:47,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... + 7: [2023-04-29 11:26:47,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +34: [2023-04-29 11:26:47,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... + 8: [2023-04-29 11:26:47,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +49: [2023-04-29 11:26:47,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 8: [2023-04-29 11:26:47,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +51: [2023-04-29 11:26:47,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +51: [2023-04-29 11:26:47,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +44: [2023-04-29 11:26:47,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +44: [2023-04-29 11:26:47,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. + 7: [2023-04-29 11:26:47,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +51: [2023-04-29 11:26:47,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +51: [2023-04-29 11:26:47,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. + 8: [2023-04-29 11:26:47,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +37: [2023-04-29 11:26:47,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +37: [2023-04-29 11:26:47,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +38: [2023-04-29 11:26:47,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +37: [2023-04-29 11:26:47,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +37: [2023-04-29 11:26:47,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +47: [2023-04-29 11:26:47,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +47: [2023-04-29 11:26:47,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +44: [2023-04-29 11:26:47,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +44: [2023-04-29 11:26:47,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. + 8: [2023-04-29 11:26:47,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +36: [2023-04-29 11:26:47,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +36: [2023-04-29 11:26:47,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. + 8: [2023-04-29 11:26:47,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... + 8: [2023-04-29 11:26:47,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +16: [2023-04-29 11:26:47,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +16: [2023-04-29 11:26:47,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +10: [2023-04-29 11:26:47,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +47: [2023-04-29 11:26:47,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +60: [2023-04-29 11:26:47,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +60: [2023-04-29 11:26:47,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +38: [2023-04-29 11:26:47,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +60: [2023-04-29 11:26:47,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +60: [2023-04-29 11:26:47,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +47: [2023-04-29 11:26:47,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +36: [2023-04-29 11:26:47,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +14: [2023-04-29 11:26:47,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +16: [2023-04-29 11:26:47,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +24: [2023-04-29 11:26:47,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +24: [2023-04-29 11:26:47,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +44: [2023-04-29 11:26:47,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +36: [2023-04-29 11:26:47,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. + 9: [2023-04-29 11:26:47,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +16: [2023-04-29 11:26:47,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +59: [2023-04-29 11:26:47,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +24: [2023-04-29 11:26:47,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +38: [2023-04-29 11:26:47,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +24: [2023-04-29 11:26:47,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 9: [2023-04-29 11:26:47,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +30: [2023-04-29 11:26:47,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +30: [2023-04-29 11:26:47,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +14: [2023-04-29 11:26:47,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +53: [2023-04-29 11:26:47,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 9: [2023-04-29 11:26:47,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +53: [2023-04-29 11:26:47,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +10: [2023-04-29 11:26:47,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 9: [2023-04-29 11:26:47,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +44: [2023-04-29 11:26:47,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +34: [2023-04-29 11:26:47,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +59: [2023-04-29 11:26:47,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +38: [2023-04-29 11:26:47,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +42: [2023-04-29 11:26:47,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +42: [2023-04-29 11:26:47,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +37: [2023-04-29 11:26:47,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +37: [2023-04-29 11:26:47,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +30: [2023-04-29 11:26:47,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +42: [2023-04-29 11:26:47,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +30: [2023-04-29 11:26:47,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +59: [2023-04-29 11:26:47,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +42: [2023-04-29 11:26:47,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +37: [2023-04-29 11:26:47,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +37: [2023-04-29 11:26:47,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +62: [2023-04-29 11:26:47,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +62: [2023-04-29 11:26:47,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +62: [2023-04-29 11:26:47,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +62: [2023-04-29 11:26:47,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +14: [2023-04-29 11:26:47,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +53: [2023-04-29 11:26:47,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +53: [2023-04-29 11:26:47,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +16: [2023-04-29 11:26:47,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +16: [2023-04-29 11:26:47,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +16: [2023-04-29 11:26:47,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +16: [2023-04-29 11:26:47,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +42: [2023-04-29 11:26:47,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +42: [2023-04-29 11:26:47,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +42: [2023-04-29 11:26:47,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +14: [2023-04-29 11:26:47,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +44: [2023-04-29 11:26:47,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +14: [2023-04-29 11:26:47,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +59: [2023-04-29 11:26:47,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +42: [2023-04-29 11:26:47,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +44: [2023-04-29 11:26:47,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +16: [2023-04-29 11:26:47,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +63: [2023-04-29 11:26:47,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +63: [2023-04-29 11:26:47,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +14: [2023-04-29 11:26:47,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +16: [2023-04-29 11:26:47,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 6: [2023-04-29 11:26:47,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 6: [2023-04-29 11:26:47,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 6: [2023-04-29 11:26:47,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +16: [2023-04-29 11:26:47,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +63: [2023-04-29 11:26:47,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +51: [2023-04-29 11:26:47,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +51: [2023-04-29 11:26:47,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +14: [2023-04-29 11:26:47,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +51: [2023-04-29 11:26:47,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +16: [2023-04-29 11:26:47,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +60: [2023-04-29 11:26:47,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +51: [2023-04-29 11:26:47,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +47: [2023-04-29 11:26:47,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +24: [2023-04-29 11:26:47,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +36: [2023-04-29 11:26:47,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +36: [2023-04-29 11:26:47,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +47: [2023-04-29 11:26:47,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +60: [2023-04-29 11:26:47,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 11:26:47,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +44: [2023-04-29 11:26:47,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +34: [2023-04-29 11:26:47,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +19: [2023-04-29 11:26:47,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +19: [2023-04-29 11:26:47,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +19: [2023-04-29 11:26:47,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +44: [2023-04-29 11:26:47,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +14: [2023-04-29 11:26:47,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +44: [2023-04-29 11:26:47,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +19: [2023-04-29 11:26:47,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +47: [2023-04-29 11:26:47,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +60: [2023-04-29 11:26:47,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +34: [2023-04-29 11:26:47,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +36: [2023-04-29 11:26:47,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 6: [2023-04-29 11:26:47,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +60: [2023-04-29 11:26:47,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 6: [2023-04-29 11:26:47,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +57: [2023-04-29 11:26:47,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +57: [2023-04-29 11:26:47,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +37: [2023-04-29 11:26:47,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 11:26:47,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +37: [2023-04-29 11:26:47,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +24: [2023-04-29 11:26:47,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +19: [2023-04-29 11:26:47,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +39: [2023-04-29 11:26:47,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +39: [2023-04-29 11:26:47,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +39: [2023-04-29 11:26:47,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +10: [2023-04-29 11:26:47,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +10: [2023-04-29 11:26:47,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +19: [2023-04-29 11:26:47,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +16: [2023-04-29 11:26:47,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +16: [2023-04-29 11:26:47,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +16: [2023-04-29 11:26:47,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +39: [2023-04-29 11:26:47,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +34: [2023-04-29 11:26:47,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +36: [2023-04-29 11:26:47,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +10: [2023-04-29 11:26:47,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +19: [2023-04-29 11:26:47,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +10: [2023-04-29 11:26:47,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +30: [2023-04-29 11:26:47,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +47: [2023-04-29 11:26:47,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +19: [2023-04-29 11:26:47,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +37: [2023-04-29 11:26:47,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +30: [2023-04-29 11:26:47,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 4: [2023-04-29 11:26:47,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 4: [2023-04-29 11:26:47,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 4: [2023-04-29 11:26:47,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 4: [2023-04-29 11:26:47,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +37: [2023-04-29 11:26:47,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +26: [2023-04-29 11:26:47,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +34: [2023-04-29 11:26:47,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +24: [2023-04-29 11:26:47,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +24: [2023-04-29 11:26:47,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +30: [2023-04-29 11:26:47,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +30: [2023-04-29 11:26:47,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +62: [2023-04-29 11:26:47,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +39: [2023-04-29 11:26:47,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +57: [2023-04-29 11:26:47,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +46: [2023-04-29 11:26:47,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +16: [2023-04-29 11:26:47,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +46: [2023-04-29 11:26:47,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. + 6: [2023-04-29 11:26:47,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +63: [2023-04-29 11:26:47,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +39: [2023-04-29 11:26:47,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +62: [2023-04-29 11:26:47,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +62: [2023-04-29 11:26:47,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +47: [2023-04-29 11:26:47,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +47: [2023-04-29 11:26:47,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +47: [2023-04-29 11:26:47,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +39: [2023-04-29 11:26:47,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +47: [2023-04-29 11:26:47,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +62: [2023-04-29 11:26:47,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 11:26:47,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +39: [2023-04-29 11:26:47,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +46: [2023-04-29 11:26:47,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +46: [2023-04-29 11:26:47,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +57: [2023-04-29 11:26:47,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +26: [2023-04-29 11:26:47,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +26: [2023-04-29 11:26:47,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +59: [2023-04-29 11:26:47,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +37: [2023-04-29 11:26:47,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +47: [2023-04-29 11:26:47,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +37: [2023-04-29 11:26:47,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +47: [2023-04-29 11:26:47,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +63: [2023-04-29 11:26:47,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 4: [2023-04-29 11:26:47,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +26: [2023-04-29 11:26:47,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +55: [2023-04-29 11:26:47,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +47: [2023-04-29 11:26:47,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +61: [2023-04-29 11:26:47,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 11:26:47,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +44: [2023-04-29 11:26:47,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +46: [2023-04-29 11:26:47,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +46: [2023-04-29 11:26:47,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +55: [2023-04-29 11:26:47,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +47: [2023-04-29 11:26:47,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +46: [2023-04-29 11:26:47,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 11:26:47,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +63: [2023-04-29 11:26:47,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +61: [2023-04-29 11:26:47,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +26: [2023-04-29 11:26:47,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 6: [2023-04-29 11:26:47,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +55: [2023-04-29 11:26:47,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +46: [2023-04-29 11:26:47,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +37: [2023-04-29 11:26:47,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +37: [2023-04-29 11:26:47,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +61: [2023-04-29 11:26:47,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +61: [2023-04-29 11:26:47,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... + 7: [2023-04-29 11:26:47,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +46: [2023-04-29 11:26:47,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +61: [2023-04-29 11:26:47,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +61: [2023-04-29 11:26:47,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +52: [2023-04-29 11:26:47,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +52: [2023-04-29 11:26:47,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +35: [2023-04-29 11:26:47,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +35: [2023-04-29 11:26:47,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +26: [2023-04-29 11:26:47,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +46: [2023-04-29 11:26:47,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +59: [2023-04-29 11:26:47,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +46: [2023-04-29 11:26:47,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +49: [2023-04-29 11:26:47,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +46: [2023-04-29 11:26:47,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +57: [2023-04-29 11:26:47,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +26: [2023-04-29 11:26:47,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +35: [2023-04-29 11:26:47,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +35: [2023-04-29 11:26:47,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +59: [2023-04-29 11:26:47,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +59: [2023-04-29 11:26:47,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +19: [2023-04-29 11:26:47,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +19: [2023-04-29 11:26:47,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +15: [2023-04-29 11:26:47,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +15: [2023-04-29 11:26:47,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +15: [2023-04-29 11:26:47,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +52: [2023-04-29 11:26:47,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +10: [2023-04-29 11:26:47,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +15: [2023-04-29 11:26:47,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +52: [2023-04-29 11:26:47,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +61: [2023-04-29 11:26:47,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +52: [2023-04-29 11:26:47,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +57: [2023-04-29 11:26:47,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +35: [2023-04-29 11:26:47,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +22: [2023-04-29 11:26:47,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +22: [2023-04-29 11:26:47,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +49: [2023-04-29 11:26:47,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +49: [2023-04-29 11:26:47,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +34: [2023-04-29 11:26:47,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +52: [2023-04-29 11:26:47,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +35: [2023-04-29 11:26:47,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +26: [2023-04-29 11:26:47,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +53: [2023-04-29 11:26:47,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +19: [2023-04-29 11:26:47,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +10: [2023-04-29 11:26:47,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +49: [2023-04-29 11:26:47,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +19: [2023-04-29 11:26:47,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +12: [2023-04-29 11:26:47,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +12: [2023-04-29 11:26:47,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +55: [2023-04-29 11:26:47,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +34: [2023-04-29 11:26:47,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +35: [2023-04-29 11:26:47,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +34: [2023-04-29 11:26:47,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +10: [2023-04-29 11:26:47,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 7: [2023-04-29 11:26:47,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +22: [2023-04-29 11:26:47,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 4: [2023-04-29 11:26:47,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +22: [2023-04-29 11:26:47,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +52: [2023-04-29 11:26:47,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +52: [2023-04-29 11:26:47,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +63: [2023-04-29 11:26:47,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +10: [2023-04-29 11:26:47,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +57: [2023-04-29 11:26:47,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 7: [2023-04-29 11:26:47,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 4: [2023-04-29 11:26:47,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +12: [2023-04-29 11:26:47,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +35: [2023-04-29 11:26:47,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +12: [2023-04-29 11:26:47,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +29: [2023-04-29 11:26:47,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +29: [2023-04-29 11:26:47,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +53: [2023-04-29 11:26:47,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +58: [2023-04-29 11:26:47,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +58: [2023-04-29 11:26:47,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +58: [2023-04-29 11:26:47,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. + 4: [2023-04-29 11:26:47,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +58: [2023-04-29 11:26:47,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +29: [2023-04-29 11:26:47,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 7: [2023-04-29 11:26:47,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +29: [2023-04-29 11:26:47,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +55: [2023-04-29 11:26:47,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +43: [2023-04-29 11:26:47,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +43: [2023-04-29 11:26:47,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +43: [2023-04-29 11:26:47,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +43: [2023-04-29 11:26:47,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +46: [2023-04-29 11:26:47,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +30: [2023-04-29 11:26:47,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +30: [2023-04-29 11:26:47,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +30: [2023-04-29 11:26:47,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +46: [2023-04-29 11:26:47,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +46: [2023-04-29 11:26:47,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +46: [2023-04-29 11:26:47,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +57: [2023-04-29 11:26:47,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +30: [2023-04-29 11:26:47,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +59: [2023-04-29 11:26:47,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +53: [2023-04-29 11:26:47,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +59: [2023-04-29 11:26:47,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +43: [2023-04-29 11:26:47,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +59: [2023-04-29 11:26:47,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +43: [2023-04-29 11:26:47,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +43: [2023-04-29 11:26:47,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +43: [2023-04-29 11:26:47,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +55: [2023-04-29 11:26:47,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +18: [2023-04-29 11:26:47,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +18: [2023-04-29 11:26:47,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +18: [2023-04-29 11:26:47,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +18: [2023-04-29 11:26:47,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +53: [2023-04-29 11:26:47,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 11:26:47,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 11:26:47,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +30: [2023-04-29 11:26:47,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +30: [2023-04-29 11:26:47,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +30: [2023-04-29 11:26:47,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +30: [2023-04-29 11:26:47,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +42: [2023-04-29 11:26:47,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +59: [2023-04-29 11:26:47,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +59: [2023-04-29 11:26:47,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +55: [2023-04-29 11:26:47,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +17: [2023-04-29 11:26:47,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +17: [2023-04-29 11:26:47,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +17: [2023-04-29 11:26:47,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 7: [2023-04-29 11:26:47,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +17: [2023-04-29 11:26:47,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +53: [2023-04-29 11:26:47,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +49: [2023-04-29 11:26:47,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 11:26:47,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 11:26:47,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +53: [2023-04-29 11:26:47,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +56: [2023-04-29 11:26:47,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +16: [2023-04-29 11:26:47,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +59: [2023-04-29 11:26:47,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +36: [2023-04-29 11:26:47,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 11:26:47,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +50: [2023-04-29 11:26:47,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +50: [2023-04-29 11:26:47,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +50: [2023-04-29 11:26:47,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +50: [2023-04-29 11:26:47,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +19: [2023-04-29 11:26:47,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +42: [2023-04-29 11:26:47,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +42: [2023-04-29 11:26:47,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 3: [2023-04-29 11:26:47,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +56: [2023-04-29 11:26:47,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +15: [2023-04-29 11:26:47,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +53: [2023-04-29 11:26:47,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 3: [2023-04-29 11:26:47,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +36: [2023-04-29 11:26:47,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +59: [2023-04-29 11:26:47,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +51: [2023-04-29 11:26:47,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +51: [2023-04-29 11:26:47,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +19: [2023-04-29 11:26:47,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +15: [2023-04-29 11:26:47,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +15: [2023-04-29 11:26:47,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +19: [2023-04-29 11:26:47,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 11:26:47,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +60: [2023-04-29 11:26:47,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 11:26:47,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 11:26:47,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 11:26:47,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +12: [2023-04-29 11:26:47,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +60: [2023-04-29 11:26:47,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 11:26:47,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +15: [2023-04-29 11:26:47,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +47: [2023-04-29 11:26:47,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +36: [2023-04-29 11:26:47,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +12: [2023-04-29 11:26:47,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +51: [2023-04-29 11:26:47,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 11:26:47,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +22: [2023-04-29 11:26:47,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +22: [2023-04-29 11:26:47,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +53: [2023-04-29 11:26:47,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +44: [2023-04-29 11:26:47,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +12: [2023-04-29 11:26:47,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +30: [2023-04-29 11:26:47,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +59: [2023-04-29 11:26:47,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +47: [2023-04-29 11:26:47,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +42: [2023-04-29 11:26:47,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +41: [2023-04-29 11:26:47,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +41: [2023-04-29 11:26:47,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +49: [2023-04-29 11:26:47,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +60: [2023-04-29 11:26:47,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +45: [2023-04-29 11:26:47,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +45: [2023-04-29 11:26:47,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +45: [2023-04-29 11:26:47,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +60: [2023-04-29 11:26:47,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +45: [2023-04-29 11:26:47,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +49: [2023-04-29 11:26:47,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +55: [2023-04-29 11:26:47,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +36: [2023-04-29 11:26:47,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 7: [2023-04-29 11:26:47,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +60: [2023-04-29 11:26:47,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +59: [2023-04-29 11:26:47,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +19: [2023-04-29 11:26:47,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +41: [2023-04-29 11:26:47,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +49: [2023-04-29 11:26:47,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +59: [2023-04-29 11:26:47,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +41: [2023-04-29 11:26:47,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 7: [2023-04-29 11:26:47,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +47: [2023-04-29 11:26:47,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +36: [2023-04-29 11:26:47,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +30: [2023-04-29 11:26:47,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +29: [2023-04-29 11:26:47,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +47: [2023-04-29 11:26:47,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +36: [2023-04-29 11:26:47,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +44: [2023-04-29 11:26:47,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +58: [2023-04-29 11:26:47,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +58: [2023-04-29 11:26:47,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +44: [2023-04-29 11:26:47,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +44: [2023-04-29 11:26:47,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +38: [2023-04-29 11:26:47,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +38: [2023-04-29 11:26:47,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +38: [2023-04-29 11:26:47,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +38: [2023-04-29 11:26:47,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +29: [2023-04-29 11:26:47,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +30: [2023-04-29 11:26:47,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +60: [2023-04-29 11:26:47,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +60: [2023-04-29 11:26:47,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 11:26:47,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +60: [2023-04-29 11:26:47,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +60: [2023-04-29 11:26:47,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +29: [2023-04-29 11:26:47,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +41: [2023-04-29 11:26:47,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +29: [2023-04-29 11:26:47,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +36: [2023-04-29 11:26:47,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +41: [2023-04-29 11:26:47,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 11:26:47,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 11:26:47,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +44: [2023-04-29 11:26:47,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +47: [2023-04-29 11:26:47,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +51: [2023-04-29 11:26:47,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +51: [2023-04-29 11:26:47,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +51: [2023-04-29 11:26:47,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +51: [2023-04-29 11:26:47,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +16: [2023-04-29 11:26:47,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 11:26:47,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +22: [2023-04-29 11:26:47,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +58: [2023-04-29 11:26:47,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +58: [2023-04-29 11:26:47,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +16: [2023-04-29 11:26:47,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +39: [2023-04-29 11:26:47,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +51: [2023-04-29 11:26:47,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +51: [2023-04-29 11:26:47,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +18: [2023-04-29 11:26:47,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +16: [2023-04-29 11:26:47,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +16: [2023-04-29 11:26:47,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +44: [2023-04-29 11:26:47,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +42: [2023-04-29 11:26:47,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +30: [2023-04-29 11:26:47,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +36: [2023-04-29 11:26:47,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +39: [2023-04-29 11:26:47,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 11:26:47,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +44: [2023-04-29 11:26:47,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... + 7: [2023-04-29 11:26:47,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +17: [2023-04-29 11:26:47,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 4: [2023-04-29 11:26:47,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +17: [2023-04-29 11:26:47,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +18: [2023-04-29 11:26:47,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +19: [2023-04-29 11:26:47,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +31: [2023-04-29 11:26:47,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +51: [2023-04-29 11:26:47,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... + 7: [2023-04-29 11:26:47,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +18: [2023-04-29 11:26:47,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +31: [2023-04-29 11:26:47,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +31: [2023-04-29 11:26:47,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +51: [2023-04-29 11:26:47,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 11:26:47,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +31: [2023-04-29 11:26:47,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +51: [2023-04-29 11:26:47,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +47: [2023-04-29 11:26:47,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +44: [2023-04-29 11:26:47,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +54: [2023-04-29 11:26:47,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +17: [2023-04-29 11:26:47,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +54: [2023-04-29 11:26:47,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +37: [2023-04-29 11:26:47,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +18: [2023-04-29 11:26:47,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +54: [2023-04-29 11:26:47,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +54: [2023-04-29 11:26:47,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +54: [2023-04-29 11:26:47,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +54: [2023-04-29 11:26:47,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +54: [2023-04-29 11:26:47,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +12: [2023-04-29 11:26:47,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +12: [2023-04-29 11:26:47,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +54: [2023-04-29 11:26:47,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +30: [2023-04-29 11:26:47,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +12: [2023-04-29 11:26:47,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +12: [2023-04-29 11:26:47,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +51: [2023-04-29 11:26:47,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +51: [2023-04-29 11:26:47,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +51: [2023-04-29 11:26:47,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +19: [2023-04-29 11:26:47,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +39: [2023-04-29 11:26:47,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +39: [2023-04-29 11:26:47,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +28: [2023-04-29 11:26:47,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +28: [2023-04-29 11:26:47,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +16: [2023-04-29 11:26:47,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +16: [2023-04-29 11:26:47,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +47: [2023-04-29 11:26:47,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +16: [2023-04-29 11:26:47,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +59: [2023-04-29 11:26:47,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +50: [2023-04-29 11:26:47,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 2: [2023-04-29 11:26:47,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 2: [2023-04-29 11:26:47,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 3: [2023-04-29 11:26:47,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +17: [2023-04-29 11:26:47,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +50: [2023-04-29 11:26:47,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +51: [2023-04-29 11:26:47,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +54: [2023-04-29 11:26:47,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +54: [2023-04-29 11:26:47,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +47: [2023-04-29 11:26:47,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +54: [2023-04-29 11:26:47,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... + 3: [2023-04-29 11:26:47,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +54: [2023-04-29 11:26:47,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 6: [2023-04-29 11:26:47,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 6: [2023-04-29 11:26:47,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +50: [2023-04-29 11:26:47,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +50: [2023-04-29 11:26:47,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +37: [2023-04-29 11:26:47,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +12: [2023-04-29 11:26:47,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 11:26:47,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +28: [2023-04-29 11:26:47,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +12: [2023-04-29 11:26:47,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +30: [2023-04-29 11:26:47,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +54: [2023-04-29 11:26:47,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +12: [2023-04-29 11:26:47,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +28: [2023-04-29 11:26:47,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +16: [2023-04-29 11:26:47,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +47: [2023-04-29 11:26:47,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +42: [2023-04-29 11:26:47,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +42: [2023-04-29 11:26:47,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +30: [2023-04-29 11:26:47,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +45: [2023-04-29 11:26:47,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +43: [2023-04-29 11:26:47,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +43: [2023-04-29 11:26:47,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +59: [2023-04-29 11:26:47,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +45: [2023-04-29 11:26:47,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +43: [2023-04-29 11:26:47,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +54: [2023-04-29 11:26:47,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +54: [2023-04-29 11:26:47,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +43: [2023-04-29 11:26:47,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +54: [2023-04-29 11:26:47,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +52: [2023-04-29 11:26:47,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +41: [2023-04-29 11:26:47,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. + 6: [2023-04-29 11:26:47,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 6: [2023-04-29 11:26:47,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 6: [2023-04-29 11:26:47,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +41: [2023-04-29 11:26:47,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +16: [2023-04-29 11:26:47,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +16: [2023-04-29 11:26:47,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +16: [2023-04-29 11:26:47,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +35: [2023-04-29 11:26:47,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +19: [2023-04-29 11:26:47,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +41: [2023-04-29 11:26:47,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +45: [2023-04-29 11:26:47,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +45: [2023-04-29 11:26:47,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 11:26:47,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +47: [2023-04-29 11:26:47,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +10: [2023-04-29 11:26:47,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +16: [2023-04-29 11:26:47,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +45: [2023-04-29 11:26:47,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +45: [2023-04-29 11:26:47,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +30: [2023-04-29 11:26:47,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +16: [2023-04-29 11:26:47,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +46: [2023-04-29 11:26:47,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +19: [2023-04-29 11:26:47,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +37: [2023-04-29 11:26:47,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +37: [2023-04-29 11:26:47,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 11:26:47,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +45: [2023-04-29 11:26:47,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +45: [2023-04-29 11:26:47,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +45: [2023-04-29 11:26:47,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +47: [2023-04-29 11:26:47,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +38: [2023-04-29 11:26:47,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +16: [2023-04-29 11:26:47,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +38: [2023-04-29 11:26:47,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +38: [2023-04-29 11:26:47,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +10: [2023-04-29 11:26:47,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +38: [2023-04-29 11:26:47,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +42: [2023-04-29 11:26:47,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +52: [2023-04-29 11:26:47,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +52: [2023-04-29 11:26:47,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +37: [2023-04-29 11:26:47,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +39: [2023-04-29 11:26:47,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +46: [2023-04-29 11:26:47,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +13: [2023-04-29 11:26:47,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +13: [2023-04-29 11:26:47,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +39: [2023-04-29 11:26:47,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +13: [2023-04-29 11:26:47,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +47: [2023-04-29 11:26:47,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +19: [2023-04-29 11:26:47,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +21: [2023-04-29 11:26:47,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +21: [2023-04-29 11:26:47,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +35: [2023-04-29 11:26:47,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +52: [2023-04-29 11:26:47,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +11: [2023-04-29 11:26:47,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +11: [2023-04-29 11:26:47,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +13: [2023-04-29 11:26:47,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +11: [2023-04-29 11:26:47,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +52: [2023-04-29 11:26:47,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +21: [2023-04-29 11:26:47,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +11: [2023-04-29 11:26:47,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +21: [2023-04-29 11:26:47,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +31: [2023-04-29 11:26:47,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +16: [2023-04-29 11:26:47,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +10: [2023-04-29 11:26:47,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +10: [2023-04-29 11:26:47,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 6: [2023-04-29 11:26:47,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +52: [2023-04-29 11:26:47,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 11:26:47,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +37: [2023-04-29 11:26:47,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... + 6: [2023-04-29 11:26:47,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +19: [2023-04-29 11:26:47,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +31: [2023-04-29 11:26:47,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +35: [2023-04-29 11:26:47,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +45: [2023-04-29 11:26:47,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +10: [2023-04-29 11:26:47,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +55: [2023-04-29 11:26:47,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +55: [2023-04-29 11:26:47,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +37: [2023-04-29 11:26:47,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +31: [2023-04-29 11:26:47,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +52: [2023-04-29 11:26:47,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +31: [2023-04-29 11:26:47,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +55: [2023-04-29 11:26:47,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +62: [2023-04-29 11:26:47,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 11:26:47,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 11:26:47,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 11:26:47,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +37: [2023-04-29 11:26:47,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +62: [2023-04-29 11:26:47,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 11:26:47,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 11:26:47,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 11:26:47,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 11:26:47,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +33: [2023-04-29 11:26:47,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +33: [2023-04-29 11:26:47,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +47: [2023-04-29 11:26:47,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +33: [2023-04-29 11:26:47,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +47: [2023-04-29 11:26:47,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 4: [2023-04-29 11:26:47,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +33: [2023-04-29 11:26:47,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +28: [2023-04-29 11:26:47,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +28: [2023-04-29 11:26:47,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +10: [2023-04-29 11:26:47,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +10: [2023-04-29 11:26:47,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +39: [2023-04-29 11:26:47,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +39: [2023-04-29 11:26:47,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +46: [2023-04-29 11:26:47,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +46: [2023-04-29 11:26:47,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 6: [2023-04-29 11:26:47,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +56: [2023-04-29 11:26:47,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 6: [2023-04-29 11:26:47,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +10: [2023-04-29 11:26:47,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +62: [2023-04-29 11:26:47,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +62: [2023-04-29 11:26:47,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +62: [2023-04-29 11:26:47,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +62: [2023-04-29 11:26:47,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +28: [2023-04-29 11:26:47,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +62: [2023-04-29 11:26:47,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +33: [2023-04-29 11:26:47,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +33: [2023-04-29 11:26:47,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +62: [2023-04-29 11:26:47,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +46: [2023-04-29 11:26:47,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +39: [2023-04-29 11:26:47,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +39: [2023-04-29 11:26:47,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +28: [2023-04-29 11:26:47,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +35: [2023-04-29 11:26:47,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +62: [2023-04-29 11:26:47,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... + 6: [2023-04-29 11:26:47,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +62: [2023-04-29 11:26:47,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +33: [2023-04-29 11:26:47,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 4: [2023-04-29 11:26:47,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +33: [2023-04-29 11:26:47,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +30: [2023-04-29 11:26:47,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +43: [2023-04-29 11:26:47,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +43: [2023-04-29 11:26:47,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +43: [2023-04-29 11:26:47,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +46: [2023-04-29 11:26:47,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 2: [2023-04-29 11:26:47,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 4: [2023-04-29 11:26:47,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +52: [2023-04-29 11:26:47,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +41: [2023-04-29 11:26:47,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +39: [2023-04-29 11:26:47,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +29: [2023-04-29 11:26:47,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +39: [2023-04-29 11:26:47,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +43: [2023-04-29 11:26:47,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +29: [2023-04-29 11:26:47,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +29: [2023-04-29 11:26:47,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 5: [2023-04-29 11:26:47,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 5: [2023-04-29 11:26:47,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. + 5: [2023-04-29 11:26:47,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +43: [2023-04-29 11:26:47,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 2: [2023-04-29 11:26:47,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +43: [2023-04-29 11:26:47,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +43: [2023-04-29 11:26:47,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +29: [2023-04-29 11:26:47,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +35: [2023-04-29 11:26:47,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +23: [2023-04-29 11:26:47,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +23: [2023-04-29 11:26:47,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +48: [2023-04-29 11:26:47,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +48: [2023-04-29 11:26:47,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +48: [2023-04-29 11:26:47,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +23: [2023-04-29 11:26:47,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +48: [2023-04-29 11:26:47,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +23: [2023-04-29 11:26:47,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +41: [2023-04-29 11:26:47,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 11:26:47,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +30: [2023-04-29 11:26:47,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +30: [2023-04-29 11:26:47,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +46: [2023-04-29 11:26:47,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +46: [2023-04-29 11:26:47,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +41: [2023-04-29 11:26:47,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +19: [2023-04-29 11:26:47,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +30: [2023-04-29 11:26:47,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +52: [2023-04-29 11:26:47,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +33: [2023-04-29 11:26:47,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +33: [2023-04-29 11:26:47,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +33: [2023-04-29 11:26:47,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. + 1: [2023-04-29 11:26:47,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +33: [2023-04-29 11:26:47,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +29: [2023-04-29 11:26:47,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +21: [2023-04-29 11:26:47,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +46: [2023-04-29 11:26:47,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +12: [2023-04-29 11:26:47,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +11: [2023-04-29 11:26:47,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +19: [2023-04-29 11:26:47,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +27: [2023-04-29 11:26:47,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +27: [2023-04-29 11:26:47,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +27: [2023-04-29 11:26:47,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +56: [2023-04-29 11:26:47,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +29: [2023-04-29 11:26:47,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 1: [2023-04-29 11:26:47,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +27: [2023-04-29 11:26:47,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +60: [2023-04-29 11:26:47,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +46: [2023-04-29 11:26:47,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +29: [2023-04-29 11:26:47,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +25: [2023-04-29 11:26:47,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +25: [2023-04-29 11:26:47,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +29: [2023-04-29 11:26:47,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +48: [2023-04-29 11:26:47,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +46: [2023-04-29 11:26:47,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 11:26:47,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +25: [2023-04-29 11:26:47,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +25: [2023-04-29 11:26:47,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +48: [2023-04-29 11:26:47,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +35: [2023-04-29 11:26:47,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +47: [2023-04-29 11:26:47,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +48: [2023-04-29 11:26:47,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +12: [2023-04-29 11:26:47,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +12: [2023-04-29 11:26:47,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +21: [2023-04-29 11:26:47,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 1: [2023-04-29 11:26:47,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +48: [2023-04-29 11:26:47,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +13: [2023-04-29 11:26:47,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +58: [2023-04-29 11:26:47,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 11:26:47,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +22: [2023-04-29 11:26:47,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +22: [2023-04-29 11:26:47,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +13: [2023-04-29 11:26:47,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +13: [2023-04-29 11:26:47,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +29: [2023-04-29 11:26:47,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +47: [2023-04-29 11:26:47,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 1: [2023-04-29 11:26:47,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +17: [2023-04-29 11:26:47,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 0: [2023-04-29 11:26:47,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +52: [2023-04-29 11:26:47,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +19: [2023-04-29 11:26:47,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 0: [2023-04-29 11:26:47,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 0: [2023-04-29 11:26:47,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +21: [2023-04-29 11:26:47,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +35: [2023-04-29 11:26:47,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +35: [2023-04-29 11:26:47,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +35: [2023-04-29 11:26:47,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +51: [2023-04-29 11:26:47,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +35: [2023-04-29 11:26:47,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +13: [2023-04-29 11:26:47,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +46: [2023-04-29 11:26:47,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +43: [2023-04-29 11:26:47,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +12: [2023-04-29 11:26:47,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +12: [2023-04-29 11:26:47,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +52: [2023-04-29 11:26:47,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +52: [2023-04-29 11:26:47,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +52: [2023-04-29 11:26:47,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 4: [2023-04-29 11:26:47,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +46: [2023-04-29 11:26:47,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +29: [2023-04-29 11:26:47,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +58: [2023-04-29 11:26:47,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +52: [2023-04-29 11:26:47,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +21: [2023-04-29 11:26:47,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +35: [2023-04-29 11:26:47,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +17: [2023-04-29 11:26:47,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +19: [2023-04-29 11:26:47,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 0: [2023-04-29 11:26:47,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +58: [2023-04-29 11:26:47,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +29: [2023-04-29 11:26:47,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +18: [2023-04-29 11:26:47,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +18: [2023-04-29 11:26:47,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +56: [2023-04-29 11:26:47,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +56: [2023-04-29 11:26:47,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +22: [2023-04-29 11:26:47,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +19: [2023-04-29 11:26:47,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +11: [2023-04-29 11:26:47,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +56: [2023-04-29 11:26:47,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +22: [2023-04-29 11:26:47,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +22: [2023-04-29 11:26:47,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +11: [2023-04-29 11:26:47,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +17: [2023-04-29 11:26:47,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +56: [2023-04-29 11:26:47,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. + 7: [2023-04-29 11:26:47,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +52: [2023-04-29 11:26:47,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +11: [2023-04-29 11:26:47,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +22: [2023-04-29 11:26:47,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +46: [2023-04-29 11:26:47,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +41: [2023-04-29 11:26:47,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +46: [2023-04-29 11:26:47,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +40: [2023-04-29 11:26:47,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +40: [2023-04-29 11:26:47,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +40: [2023-04-29 11:26:47,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +40: [2023-04-29 11:26:47,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +55: [2023-04-29 11:26:47,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +55: [2023-04-29 11:26:47,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +18: [2023-04-29 11:26:47,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +18: [2023-04-29 11:26:47,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +18: [2023-04-29 11:26:47,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +46: [2023-04-29 11:26:47,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +56: [2023-04-29 11:26:47,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +60: [2023-04-29 11:26:47,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 11:26:47,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +29: [2023-04-29 11:26:47,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +12: [2023-04-29 11:26:47,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +39: [2023-04-29 11:26:47,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +19: [2023-04-29 11:26:47,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +58: [2023-04-29 11:26:47,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +12: [2023-04-29 11:26:47,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +17: [2023-04-29 11:26:47,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... + 7: [2023-04-29 11:26:47,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 7: [2023-04-29 11:26:47,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +54: [2023-04-29 11:26:47,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +22: [2023-04-29 11:26:47,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +58: [2023-04-29 11:26:47,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +30: [2023-04-29 11:26:47,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +29: [2023-04-29 11:26:47,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +50: [2023-04-29 11:26:47,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +18: [2023-04-29 11:26:47,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +55: [2023-04-29 11:26:47,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +55: [2023-04-29 11:26:47,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +39: [2023-04-29 11:26:47,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +18: [2023-04-29 11:26:47,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +43: [2023-04-29 11:26:47,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +43: [2023-04-29 11:26:47,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +60: [2023-04-29 11:26:47,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +41: [2023-04-29 11:26:47,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +17: [2023-04-29 11:26:47,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +18: [2023-04-29 11:26:47,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +50: [2023-04-29 11:26:47,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +52: [2023-04-29 11:26:47,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +18: [2023-04-29 11:26:47,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +18: [2023-04-29 11:26:47,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 11:26:47,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +54: [2023-04-29 11:26:47,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +23: [2023-04-29 11:26:47,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +18: [2023-04-29 11:26:47,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +23: [2023-04-29 11:26:47,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +18: [2023-04-29 11:26:47,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +35: [2023-04-29 11:26:47,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +58: [2023-04-29 11:26:47,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +23: [2023-04-29 11:26:47,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +51: [2023-04-29 11:26:47,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +51: [2023-04-29 11:26:47,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +51: [2023-04-29 11:26:47,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +39: [2023-04-29 11:26:47,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +39: [2023-04-29 11:26:47,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +41: [2023-04-29 11:26:47,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +41: [2023-04-29 11:26:47,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +23: [2023-04-29 11:26:47,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 11:26:47,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +19: [2023-04-29 11:26:47,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +29: [2023-04-29 11:26:47,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +33: [2023-04-29 11:26:47,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +29: [2023-04-29 11:26:47,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +43: [2023-04-29 11:26:47,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +60: [2023-04-29 11:26:47,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +58: [2023-04-29 11:26:47,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +50: [2023-04-29 11:26:47,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +50: [2023-04-29 11:26:47,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +50: [2023-04-29 11:26:47,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +17: [2023-04-29 11:26:47,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... + 7: [2023-04-29 11:26:47,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +17: [2023-04-29 11:26:47,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 7: [2023-04-29 11:26:47,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +27: [2023-04-29 11:26:47,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +49: [2023-04-29 11:26:47,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +49: [2023-04-29 11:26:47,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +27: [2023-04-29 11:26:47,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +30: [2023-04-29 11:26:47,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +49: [2023-04-29 11:26:47,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +49: [2023-04-29 11:26:47,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +56: [2023-04-29 11:26:47,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +27: [2023-04-29 11:26:47,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +27: [2023-04-29 11:26:47,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +18: [2023-04-29 11:26:47,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +30: [2023-04-29 11:26:47,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +18: [2023-04-29 11:26:47,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +50: [2023-04-29 11:26:47,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +25: [2023-04-29 11:26:47,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +58: [2023-04-29 11:26:47,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +54: [2023-04-29 11:26:47,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +54: [2023-04-29 11:26:47,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +30: [2023-04-29 11:26:47,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +18: [2023-04-29 11:26:47,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +33: [2023-04-29 11:26:47,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +19: [2023-04-29 11:26:47,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +12: [2023-04-29 11:26:47,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +12: [2023-04-29 11:26:47,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +25: [2023-04-29 11:26:47,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +25: [2023-04-29 11:26:47,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +33: [2023-04-29 11:26:47,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +33: [2023-04-29 11:26:47,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +19: [2023-04-29 11:26:47,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +50: [2023-04-29 11:26:47,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +56: [2023-04-29 11:26:47,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +17: [2023-04-29 11:26:47,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +25: [2023-04-29 11:26:47,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +45: [2023-04-29 11:26:47,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +51: [2023-04-29 11:26:47,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +50: [2023-04-29 11:26:47,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +29: [2023-04-29 11:26:47,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +12: [2023-04-29 11:26:47,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +19: [2023-04-29 11:26:47,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +12: [2023-04-29 11:26:47,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +38: [2023-04-29 11:26:47,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +38: [2023-04-29 11:26:47,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +25: [2023-04-29 11:26:47,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +25: [2023-04-29 11:26:47,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +45: [2023-04-29 11:26:47,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +25: [2023-04-29 11:26:47,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +62: [2023-04-29 11:26:47,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +18: [2023-04-29 11:26:47,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +25: [2023-04-29 11:26:47,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +43: [2023-04-29 11:26:47,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +45: [2023-04-29 11:26:47,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +35: [2023-04-29 11:26:47,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +35: [2023-04-29 11:26:47,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +45: [2023-04-29 11:26:47,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +35: [2023-04-29 11:26:47,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +31: [2023-04-29 11:26:47,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +35: [2023-04-29 11:26:47,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +56: [2023-04-29 11:26:47,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +40: [2023-04-29 11:26:47,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +25: [2023-04-29 11:26:47,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +38: [2023-04-29 11:26:47,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +38: [2023-04-29 11:26:47,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +25: [2023-04-29 11:26:47,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +38: [2023-04-29 11:26:47,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +38: [2023-04-29 11:26:47,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +25: [2023-04-29 11:26:47,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +25: [2023-04-29 11:26:47,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +45: [2023-04-29 11:26:47,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 8: [2023-04-29 11:26:47,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 8: [2023-04-29 11:26:47,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 8: [2023-04-29 11:26:47,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +15: [2023-04-29 11:26:47,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +15: [2023-04-29 11:26:47,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +56: [2023-04-29 11:26:47,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +40: [2023-04-29 11:26:47,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +15: [2023-04-29 11:26:47,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +15: [2023-04-29 11:26:47,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +15: [2023-04-29 11:26:47,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +15: [2023-04-29 11:26:47,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +15: [2023-04-29 11:26:47,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +31: [2023-04-29 11:26:47,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +41: [2023-04-29 11:26:47,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 11:26:47,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +15: [2023-04-29 11:26:47,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +60: [2023-04-29 11:26:47,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +40: [2023-04-29 11:26:47,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +40: [2023-04-29 11:26:47,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +62: [2023-04-29 11:26:47,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +56: [2023-04-29 11:26:47,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +56: [2023-04-29 11:26:47,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +45: [2023-04-29 11:26:47,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +38: [2023-04-29 11:26:47,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +45: [2023-04-29 11:26:47,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +38: [2023-04-29 11:26:47,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +51: [2023-04-29 11:26:47,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +41: [2023-04-29 11:26:47,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +42: [2023-04-29 11:26:47,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +42: [2023-04-29 11:26:47,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +21: [2023-04-29 11:26:47,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +42: [2023-04-29 11:26:47,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +15: [2023-04-29 11:26:47,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +28: [2023-04-29 11:26:47,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +42: [2023-04-29 11:26:47,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +51: [2023-04-29 11:26:47,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +20: [2023-04-29 11:26:47,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +60: [2023-04-29 11:26:47,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +20: [2023-04-29 11:26:47,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +15: [2023-04-29 11:26:47,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +51: [2023-04-29 11:26:47,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +62: [2023-04-29 11:26:47,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 11:26:47,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +15: [2023-04-29 11:26:47,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 11:26:47,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +31: [2023-04-29 11:26:47,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +20: [2023-04-29 11:26:47,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_13-model_01-model_states.pt. +28: [2023-04-29 11:26:47,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +60: [2023-04-29 11:26:47,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +54: [2023-04-29 11:26:47,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +45: [2023-04-29 11:26:47,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +54: [2023-04-29 11:26:47,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 1: [2023-04-29 11:26:47,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 1: [2023-04-29 11:26:47,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 2: [2023-04-29 11:26:47,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +15: [2023-04-29 11:26:47,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +15: [2023-04-29 11:26:47,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +41: [2023-04-29 11:26:47,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +49: [2023-04-29 11:26:47,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +49: [2023-04-29 11:26:47,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +15: [2023-04-29 11:26:47,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +49: [2023-04-29 11:26:47,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +15: [2023-04-29 11:26:47,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +31: [2023-04-29 11:26:47,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +31: [2023-04-29 11:26:47,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +15: [2023-04-29 11:26:47,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 1: [2023-04-29 11:26:47,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 1: [2023-04-29 11:26:47,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +54: [2023-04-29 11:26:47,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +41: [2023-04-29 11:26:47,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +21: [2023-04-29 11:26:47,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +40: [2023-04-29 11:26:47,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +40: [2023-04-29 11:26:47,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +40: [2023-04-29 11:26:47,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +40: [2023-04-29 11:26:47,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +28: [2023-04-29 11:26:47,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +28: [2023-04-29 11:26:47,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +45: [2023-04-29 11:26:47,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +45: [2023-04-29 11:26:47,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +49: [2023-04-29 11:26:47,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +28: [2023-04-29 11:26:47,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +33: [2023-04-29 11:26:47,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +28: [2023-04-29 11:26:47,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +22: [2023-04-29 11:26:47,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 11:26:47,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 11:26:47,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 11:26:47,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 0: [2023-04-29 11:26:47,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 0: [2023-04-29 11:26:47,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +43: [2023-04-29 11:26:47,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 0: [2023-04-29 11:26:47,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 0: [2023-04-29 11:26:47,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +31: [2023-04-29 11:26:47,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... + 2: [2023-04-29 11:26:47,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +45: [2023-04-29 11:26:47,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +54: [2023-04-29 11:26:47,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +31: [2023-04-29 11:26:47,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +12: [2023-04-29 11:26:47,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +12: [2023-04-29 11:26:47,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +45: [2023-04-29 11:26:47,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +48: [2023-04-29 11:26:47,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +31: [2023-04-29 11:26:47,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +40: [2023-04-29 11:26:47,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +40: [2023-04-29 11:26:47,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +28: [2023-04-29 11:26:47,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +33: [2023-04-29 11:26:47,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +45: [2023-04-29 11:26:47,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +28: [2023-04-29 11:26:47,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +22: [2023-04-29 11:26:47,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +29: [2023-04-29 11:26:47,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +12: [2023-04-29 11:26:47,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +43: [2023-04-29 11:26:47,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +40: [2023-04-29 11:26:47,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +40: [2023-04-29 11:26:47,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +29: [2023-04-29 11:26:47,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 11:26:47,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +22: [2023-04-29 11:26:47,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +11: [2023-04-29 11:26:47,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +62: [2023-04-29 11:26:47,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +41: [2023-04-29 11:26:47,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +43: [2023-04-29 11:26:47,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +43: [2023-04-29 11:26:47,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +12: [2023-04-29 11:26:47,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +22: [2023-04-29 11:26:47,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +24: [2023-04-29 11:26:47,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +57: [2023-04-29 11:26:47,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +57: [2023-04-29 11:26:47,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +57: [2023-04-29 11:26:47,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +24: [2023-04-29 11:26:47,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +24: [2023-04-29 11:26:47,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +45: [2023-04-29 11:26:47,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +57: [2023-04-29 11:26:47,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +24: [2023-04-29 11:26:47,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +24: [2023-04-29 11:26:47,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +24: [2023-04-29 11:26:47,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +24: [2023-04-29 11:26:47,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +24: [2023-04-29 11:26:47,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 2: [2023-04-29 11:26:47,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +48: [2023-04-29 11:26:47,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +13: [2023-04-29 11:26:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +11: [2023-04-29 11:26:47,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +13: [2023-04-29 11:26:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +13: [2023-04-29 11:26:47,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +41: [2023-04-29 11:26:47,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +43: [2023-04-29 11:26:47,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +43: [2023-04-29 11:26:47,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +14: [2023-04-29 11:26:47,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +24: [2023-04-29 11:26:47,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +48: [2023-04-29 11:26:47,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +14: [2023-04-29 11:26:47,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +14: [2023-04-29 11:26:47,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +14: [2023-04-29 11:26:47,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 2: [2023-04-29 11:26:47,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +24: [2023-04-29 11:26:47,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +24: [2023-04-29 11:26:47,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +29: [2023-04-29 11:26:47,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +29: [2023-04-29 11:26:47,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +48: [2023-04-29 11:26:47,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +13: [2023-04-29 11:26:47,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +52: [2023-04-29 11:26:47,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +62: [2023-04-29 11:26:47,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +24: [2023-04-29 11:26:47,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 11:26:47,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +24: [2023-04-29 11:26:47,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +43: [2023-04-29 11:26:47,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +21: [2023-04-29 11:26:47,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +21: [2023-04-29 11:26:47,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +24: [2023-04-29 11:26:47,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +13: [2023-04-29 11:26:47,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +13: [2023-04-29 11:26:47,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +24: [2023-04-29 11:26:47,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 2: [2023-04-29 11:26:47,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +24: [2023-04-29 11:26:47,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +13: [2023-04-29 11:26:47,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... + 0: [2023-04-29 11:26:47,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +41: [2023-04-29 11:26:47,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +41: [2023-04-29 11:26:47,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +21: [2023-04-29 11:26:47,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +52: [2023-04-29 11:26:47,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +52: [2023-04-29 11:26:47,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +33: [2023-04-29 11:26:47,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +55: [2023-04-29 11:26:47,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 2: [2023-04-29 11:26:47,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... + 1: [2023-04-29 11:26:47,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +42: [2023-04-29 11:26:47,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +20: [2023-04-29 11:26:47,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +42: [2023-04-29 11:26:47,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +62: [2023-04-29 11:26:47,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +62: [2023-04-29 11:26:47,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +42: [2023-04-29 11:26:47,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 1: [2023-04-29 11:26:47,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 8: [2023-04-29 11:26:47,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 1: [2023-04-29 11:26:47,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +13: [2023-04-29 11:26:47,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +52: [2023-04-29 11:26:47,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 11:26:47,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +63: [2023-04-29 11:26:47,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +42: [2023-04-29 11:26:47,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +18: [2023-04-29 11:26:47,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +41: [2023-04-29 11:26:47,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +43: [2023-04-29 11:26:47,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +52: [2023-04-29 11:26:47,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +63: [2023-04-29 11:26:47,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. +27: [2023-04-29 11:26:47,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +27: [2023-04-29 11:26:47,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +39: [2023-04-29 11:26:47,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +39: [2023-04-29 11:26:47,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 11:26:47,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_35-model_01-model_states.pt. + 8: [2023-04-29 11:26:47,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +52: [2023-04-29 11:26:47,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +52: [2023-04-29 11:26:47,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... + 1: [2023-04-29 11:26:47,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 11:26:47,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +55: [2023-04-29 11:26:47,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +21: [2023-04-29 11:26:47,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +21: [2023-04-29 11:26:47,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +18: [2023-04-29 11:26:47,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +18: [2023-04-29 11:26:47,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +20: [2023-04-29 11:26:47,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt... +33: [2023-04-29 11:26:47,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +18: [2023-04-29 11:26:47,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +41: [2023-04-29 11:26:47,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +41: [2023-04-29 11:26:47,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +45: [2023-04-29 11:26:47,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +52: [2023-04-29 11:26:47,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +11: [2023-04-29 11:26:47,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +48: [2023-04-29 11:26:47,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +41: [2023-04-29 11:26:47,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +29: [2023-04-29 11:26:47,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +21: [2023-04-29 11:26:47,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +27: [2023-04-29 11:26:47,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 0: [2023-04-29 11:26:47,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +45: [2023-04-29 11:26:47,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +29: [2023-04-29 11:26:47,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +33: [2023-04-29 11:26:47,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +33: [2023-04-29 11:26:47,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +11: [2023-04-29 11:26:47,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +55: [2023-04-29 11:26:47,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +39: [2023-04-29 11:26:47,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +39: [2023-04-29 11:26:47,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +55: [2023-04-29 11:26:47,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 0: [2023-04-29 11:26:47,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +27: [2023-04-29 11:26:47,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +27: [2023-04-29 11:26:47,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +27: [2023-04-29 11:26:47,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +11: [2023-04-29 11:26:47,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +21: [2023-04-29 11:26:47,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +21: [2023-04-29 11:26:47,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +21: [2023-04-29 11:26:47,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +21: [2023-04-29 11:26:47,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +39: [2023-04-29 11:26:47,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +11: [2023-04-29 11:26:47,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +57: [2023-04-29 11:26:47,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +35: [2023-04-29 11:26:47,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +39: [2023-04-29 11:26:47,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +27: [2023-04-29 11:26:47,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +57: [2023-04-29 11:26:47,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +57: [2023-04-29 11:26:47,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +55: [2023-04-29 11:26:47,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +57: [2023-04-29 11:26:47,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +14: [2023-04-29 11:26:47,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +25: [2023-04-29 11:26:47,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +25: [2023-04-29 11:26:47,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +55: [2023-04-29 11:26:47,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +48: [2023-04-29 11:26:47,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +55: [2023-04-29 11:26:47,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +25: [2023-04-29 11:26:47,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +11: [2023-04-29 11:26:47,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +21: [2023-04-29 11:26:47,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +61: [2023-04-29 11:26:47,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +21: [2023-04-29 11:26:47,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +61: [2023-04-29 11:26:47,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +61: [2023-04-29 11:26:47,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +35: [2023-04-29 11:26:47,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +61: [2023-04-29 11:26:47,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +21: [2023-04-29 11:26:47,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +21: [2023-04-29 11:26:47,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +33: [2023-04-29 11:26:47,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +48: [2023-04-29 11:26:47,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +39: [2023-04-29 11:26:47,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +11: [2023-04-29 11:26:47,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... + 3: [2023-04-29 11:26:47,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +14: [2023-04-29 11:26:47,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +39: [2023-04-29 11:26:47,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +25: [2023-04-29 11:26:47,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +28: [2023-04-29 11:26:47,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +28: [2023-04-29 11:26:47,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +28: [2023-04-29 11:26:47,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +28: [2023-04-29 11:26:47,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +27: [2023-04-29 11:26:47,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... + 0: [2023-04-29 11:26:47,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +29: [2023-04-29 11:26:47,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +29: [2023-04-29 11:26:47,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +56: [2023-04-29 11:26:47,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +55: [2023-04-29 11:26:47,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +48: [2023-04-29 11:26:47,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +25: [2023-04-29 11:26:47,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +25: [2023-04-29 11:26:47,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +14: [2023-04-29 11:26:47,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +14: [2023-04-29 11:26:47,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +25: [2023-04-29 11:26:47,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +25: [2023-04-29 11:26:47,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +61: [2023-04-29 11:26:47,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +61: [2023-04-29 11:26:47,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +61: [2023-04-29 11:26:47,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +61: [2023-04-29 11:26:47,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +33: [2023-04-29 11:26:47,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +28: [2023-04-29 11:26:47,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +28: [2023-04-29 11:26:47,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +15: [2023-04-29 11:26:47,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +18: [2023-04-29 11:26:47,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +25: [2023-04-29 11:26:47,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +28: [2023-04-29 11:26:47,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +56: [2023-04-29 11:26:47,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +28: [2023-04-29 11:26:47,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +33: [2023-04-29 11:26:47,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +33: [2023-04-29 11:26:47,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +56: [2023-04-29 11:26:47,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 0: [2023-04-29 11:26:47,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +23: [2023-04-29 11:26:47,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +23: [2023-04-29 11:26:47,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +49: [2023-04-29 11:26:47,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +23: [2023-04-29 11:26:47,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +23: [2023-04-29 11:26:47,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +23: [2023-04-29 11:26:47,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +23: [2023-04-29 11:26:47,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +23: [2023-04-29 11:26:47,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +63: [2023-04-29 11:26:47,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +63: [2023-04-29 11:26:47,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +25: [2023-04-29 11:26:47,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +23: [2023-04-29 11:26:47,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +25: [2023-04-29 11:26:47,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +11: [2023-04-29 11:26:47,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +40: [2023-04-29 11:26:47,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +11: [2023-04-29 11:26:47,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +11: [2023-04-29 11:26:47,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +35: [2023-04-29 11:26:47,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +35: [2023-04-29 11:26:47,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +35: [2023-04-29 11:26:47,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +11: [2023-04-29 11:26:47,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +15: [2023-04-29 11:26:47,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +15: [2023-04-29 11:26:47,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +40: [2023-04-29 11:26:47,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +18: [2023-04-29 11:26:47,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +26: [2023-04-29 11:26:47,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +27: [2023-04-29 11:26:47,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +27: [2023-04-29 11:26:47,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +27: [2023-04-29 11:26:47,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +23: [2023-04-29 11:26:47,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +18: [2023-04-29 11:26:47,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +49: [2023-04-29 11:26:47,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +56: [2023-04-29 11:26:47,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +27: [2023-04-29 11:26:47,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +26: [2023-04-29 11:26:47,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +26: [2023-04-29 11:26:47,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +25: [2023-04-29 11:26:47,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +33: [2023-04-29 11:26:47,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +26: [2023-04-29 11:26:47,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +18: [2023-04-29 11:26:47,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +33: [2023-04-29 11:26:47,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +49: [2023-04-29 11:26:47,596] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +23: [2023-04-29 11:26:47,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +23: [2023-04-29 11:26:47,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +23: [2023-04-29 11:26:47,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +11: [2023-04-29 11:26:47,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +63: [2023-04-29 11:26:47,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +23: [2023-04-29 11:26:47,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +23: [2023-04-29 11:26:47,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +40: [2023-04-29 11:26:47,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +23: [2023-04-29 11:26:47,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +33: [2023-04-29 11:26:47,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +31: [2023-04-29 11:26:47,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +31: [2023-04-29 11:26:47,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +56: [2023-04-29 11:26:47,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +56: [2023-04-29 11:26:47,599] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +35: [2023-04-29 11:26:47,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +35: [2023-04-29 11:26:47,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +35: [2023-04-29 11:26:47,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +23: [2023-04-29 11:26:47,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +63: [2023-04-29 11:26:47,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt... +40: [2023-04-29 11:26:47,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +40: [2023-04-29 11:26:47,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +40: [2023-04-29 11:26:47,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +40: [2023-04-29 11:26:47,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +31: [2023-04-29 11:26:47,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +11: [2023-04-29 11:26:47,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +31: [2023-04-29 11:26:47,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +11: [2023-04-29 11:26:47,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +27: [2023-04-29 11:26:47,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +27: [2023-04-29 11:26:47,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +49: [2023-04-29 11:26:47,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +11: [2023-04-29 11:26:47,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +15: [2023-04-29 11:26:47,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +27: [2023-04-29 11:26:47,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +33: [2023-04-29 11:26:47,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +27: [2023-04-29 11:26:47,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +49: [2023-04-29 11:26:47,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +49: [2023-04-29 11:26:47,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +40: [2023-04-29 11:26:47,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +33: [2023-04-29 11:26:47,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +22: [2023-04-29 11:26:47,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +31: [2023-04-29 11:26:47,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +40: [2023-04-29 11:26:47,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +56: [2023-04-29 11:26:47,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +31: [2023-04-29 11:26:47,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +56: [2023-04-29 11:26:47,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +31: [2023-04-29 11:26:47,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +40: [2023-04-29 11:26:47,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +49: [2023-04-29 11:26:47,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +20: [2023-04-29 11:26:47,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +20: [2023-04-29 11:26:47,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +49: [2023-04-29 11:26:47,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +31: [2023-04-29 11:26:47,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 11:26:47,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +24: [2023-04-29 11:26:47,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +20: [2023-04-29 11:26:47,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +58: [2023-04-29 11:26:47,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +25: [2023-04-29 11:26:47,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +58: [2023-04-29 11:26:47,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +58: [2023-04-29 11:26:47,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +33: [2023-04-29 11:26:47,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +58: [2023-04-29 11:26:47,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +20: [2023-04-29 11:26:47,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +15: [2023-04-29 11:26:47,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +22: [2023-04-29 11:26:47,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +20: [2023-04-29 11:26:47,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 11:26:47,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 11:26:47,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 9: [2023-04-29 11:26:47,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 9: [2023-04-29 11:26:47,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 11:26:47,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +24: [2023-04-29 11:26:47,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 9: [2023-04-29 11:26:47,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 9: [2023-04-29 11:26:47,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 9: [2023-04-29 11:26:47,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 9: [2023-04-29 11:26:47,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 9: [2023-04-29 11:26:47,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +58: [2023-04-29 11:26:47,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +58: [2023-04-29 11:26:47,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +58: [2023-04-29 11:26:47,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +58: [2023-04-29 11:26:47,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +22: [2023-04-29 11:26:47,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +25: [2023-04-29 11:26:47,619] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +40: [2023-04-29 11:26:47,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 9: [2023-04-29 11:26:47,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +40: [2023-04-29 11:26:47,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +25: [2023-04-29 11:26:47,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +24: [2023-04-29 11:26:47,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +15: [2023-04-29 11:26:47,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 9: [2023-04-29 11:26:47,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 0: [2023-04-29 11:26:47,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 9: [2023-04-29 11:26:47,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 9: [2023-04-29 11:26:47,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 9: [2023-04-29 11:26:47,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +20: [2023-04-29 11:26:47,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +25: [2023-04-29 11:26:47,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 9: [2023-04-29 11:26:47,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 8: [2023-04-29 11:26:47,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 9: [2023-04-29 11:26:47,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +15: [2023-04-29 11:26:47,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 8: [2023-04-29 11:26:47,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 9: [2023-04-29 11:26:47,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 9: [2023-04-29 11:26:47,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +26: [2023-04-29 11:26:47,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +40: [2023-04-29 11:26:47,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +13: [2023-04-29 11:26:47,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +13: [2023-04-29 11:26:47,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +13: [2023-04-29 11:26:47,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +13: [2023-04-29 11:26:47,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +17: [2023-04-29 11:26:47,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +17: [2023-04-29 11:26:47,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +42: [2023-04-29 11:26:47,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +42: [2023-04-29 11:26:47,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +17: [2023-04-29 11:26:47,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +17: [2023-04-29 11:26:47,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +42: [2023-04-29 11:26:47,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +26: [2023-04-29 11:26:47,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 11:26:47,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +42: [2023-04-29 11:26:47,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +22: [2023-04-29 11:26:47,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +20: [2023-04-29 11:26:47,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +40: [2023-04-29 11:26:47,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +24: [2023-04-29 11:26:47,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +15: [2023-04-29 11:26:47,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 8: [2023-04-29 11:26:47,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 8: [2023-04-29 11:26:47,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 8: [2023-04-29 11:26:47,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 8: [2023-04-29 11:26:47,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +26: [2023-04-29 11:26:47,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +17: [2023-04-29 11:26:47,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +13: [2023-04-29 11:26:47,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +13: [2023-04-29 11:26:47,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +13: [2023-04-29 11:26:47,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +17: [2023-04-29 11:26:47,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +13: [2023-04-29 11:26:47,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +42: [2023-04-29 11:26:47,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +42: [2023-04-29 11:26:47,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +42: [2023-04-29 11:26:47,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +26: [2023-04-29 11:26:47,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +42: [2023-04-29 11:26:47,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... + 1: [2023-04-29 11:26:47,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +20: [2023-04-29 11:26:47,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +17: [2023-04-29 11:26:47,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 1: [2023-04-29 11:26:47,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +24: [2023-04-29 11:26:47,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +17: [2023-04-29 11:26:47,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +32: [2023-04-29 11:26:47,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +32: [2023-04-29 11:26:47,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +32: [2023-04-29 11:26:47,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +32: [2023-04-29 11:26:47,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +57: [2023-04-29 11:26:47,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +20: [2023-04-29 11:26:47,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +20: [2023-04-29 11:26:47,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_00-model_states.pt. +53: [2023-04-29 11:26:47,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +53: [2023-04-29 11:26:47,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +24: [2023-04-29 11:26:47,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 1: [2023-04-29 11:26:47,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +53: [2023-04-29 11:26:47,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +53: [2023-04-29 11:26:47,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 8: [2023-04-29 11:26:47,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +57: [2023-04-29 11:26:47,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... + 8: [2023-04-29 11:26:47,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +24: [2023-04-29 11:26:47,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +21: [2023-04-29 11:26:47,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +21: [2023-04-29 11:26:47,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +32: [2023-04-29 11:26:47,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +32: [2023-04-29 11:26:47,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +32: [2023-04-29 11:26:47,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +57: [2023-04-29 11:26:47,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +32: [2023-04-29 11:26:47,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +21: [2023-04-29 11:26:47,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +22: [2023-04-29 11:26:47,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +28: [2023-04-29 11:26:47,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +53: [2023-04-29 11:26:47,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 11:26:47,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 1: [2023-04-29 11:26:47,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +20: [2023-04-29 11:26:47,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +57: [2023-04-29 11:26:47,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +53: [2023-04-29 11:26:47,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +53: [2023-04-29 11:26:47,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +21: [2023-04-29 11:26:47,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +40: [2023-04-29 11:26:47,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +53: [2023-04-29 11:26:47,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +26: [2023-04-29 11:26:47,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +26: [2023-04-29 11:26:47,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +26: [2023-04-29 11:26:47,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 11:26:47,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +20: [2023-04-29 11:26:47,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt... +61: [2023-04-29 11:26:47,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +61: [2023-04-29 11:26:47,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 0: [2023-04-29 11:26:47,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +14: [2023-04-29 11:26:47,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 8: [2023-04-29 11:26:47,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +14: [2023-04-29 11:26:47,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +40: [2023-04-29 11:26:47,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 8: [2023-04-29 11:26:47,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +57: [2023-04-29 11:26:47,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +57: [2023-04-29 11:26:47,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +57: [2023-04-29 11:26:47,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... + 1: [2023-04-29 11:26:47,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +23: [2023-04-29 11:26:47,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +26: [2023-04-29 11:26:47,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +26: [2023-04-29 11:26:47,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +28: [2023-04-29 11:26:47,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +26: [2023-04-29 11:26:47,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 0: [2023-04-29 11:26:47,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +26: [2023-04-29 11:26:47,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +30: [2023-04-29 11:26:47,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +61: [2023-04-29 11:26:47,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +61: [2023-04-29 11:26:47,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +30: [2023-04-29 11:26:47,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +30: [2023-04-29 11:26:47,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 3: [2023-04-29 11:26:47,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 0: [2023-04-29 11:26:47,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +57: [2023-04-29 11:26:47,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +14: [2023-04-29 11:26:47,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +14: [2023-04-29 11:26:47,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +14: [2023-04-29 11:26:47,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +14: [2023-04-29 11:26:47,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +14: [2023-04-29 11:26:47,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +14: [2023-04-29 11:26:47,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +14: [2023-04-29 11:26:47,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +24: [2023-04-29 11:26:47,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +11: [2023-04-29 11:26:47,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 0: [2023-04-29 11:26:47,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +28: [2023-04-29 11:26:47,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +28: [2023-04-29 11:26:47,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +23: [2023-04-29 11:26:47,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +14: [2023-04-29 11:26:47,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +14: [2023-04-29 11:26:47,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +14: [2023-04-29 11:26:47,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +26: [2023-04-29 11:26:47,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +27: [2023-04-29 11:26:47,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +14: [2023-04-29 11:26:47,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +63: [2023-04-29 11:26:47,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 11:26:47,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +14: [2023-04-29 11:26:47,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +14: [2023-04-29 11:26:47,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +14: [2023-04-29 11:26:47,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +23: [2023-04-29 11:26:47,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +30: [2023-04-29 11:26:47,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +63: [2023-04-29 11:26:47,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +63: [2023-04-29 11:26:47,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +63: [2023-04-29 11:26:47,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... +27: [2023-04-29 11:26:47,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +27: [2023-04-29 11:26:47,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +27: [2023-04-29 11:26:47,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 0: [2023-04-29 11:26:47,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +21: [2023-04-29 11:26:47,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +21: [2023-04-29 11:26:47,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +21: [2023-04-29 11:26:47,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +63: [2023-04-29 11:26:47,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_00-model_states.pt. +63: [2023-04-29 11:26:47,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... + 5: [2023-04-29 11:26:47,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +61: [2023-04-29 11:26:47,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +28: [2023-04-29 11:26:47,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +21: [2023-04-29 11:26:47,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +11: [2023-04-29 11:26:47,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +11: [2023-04-29 11:26:47,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +31: [2023-04-29 11:26:47,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +11: [2023-04-29 11:26:47,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +23: [2023-04-29 11:26:47,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +20: [2023-04-29 11:26:47,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +23: [2023-04-29 11:26:47,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +31: [2023-04-29 11:26:47,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +31: [2023-04-29 11:26:47,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +31: [2023-04-29 11:26:47,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +61: [2023-04-29 11:26:47,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 4: [2023-04-29 11:26:47,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 4: [2023-04-29 11:26:47,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 4: [2023-04-29 11:26:47,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 5: [2023-04-29 11:26:47,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 5: [2023-04-29 11:26:47,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +63: [2023-04-29 11:26:47,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +63: [2023-04-29 11:26:47,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +63: [2023-04-29 11:26:47,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +63: [2023-04-29 11:26:47,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +11: [2023-04-29 11:26:47,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +61: [2023-04-29 11:26:47,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +36: [2023-04-29 11:26:47,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +36: [2023-04-29 11:26:47,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +36: [2023-04-29 11:26:47,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +61: [2023-04-29 11:26:47,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 11:26:47,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +36: [2023-04-29 11:26:47,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +63: [2023-04-29 11:26:47,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt... + 5: [2023-04-29 11:26:47,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 2: [2023-04-29 11:26:47,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +28: [2023-04-29 11:26:47,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +58: [2023-04-29 11:26:47,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 6: [2023-04-29 11:26:47,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 6: [2023-04-29 11:26:47,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 6: [2023-04-29 11:26:47,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +30: [2023-04-29 11:26:47,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +30: [2023-04-29 11:26:47,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +30: [2023-04-29 11:26:47,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 9: [2023-04-29 11:26:47,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +58: [2023-04-29 11:26:47,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +58: [2023-04-29 11:26:47,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +34: [2023-04-29 11:26:47,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +34: [2023-04-29 11:26:47,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +34: [2023-04-29 11:26:47,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +63: [2023-04-29 11:26:47,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +34: [2023-04-29 11:26:47,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +58: [2023-04-29 11:26:47,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 2: [2023-04-29 11:26:47,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 9: [2023-04-29 11:26:47,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +36: [2023-04-29 11:26:47,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +36: [2023-04-29 11:26:47,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +36: [2023-04-29 11:26:47,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +63: [2023-04-29 11:26:47,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +63: [2023-04-29 11:26:47,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +63: [2023-04-29 11:26:47,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +36: [2023-04-29 11:26:47,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 9: [2023-04-29 11:26:47,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 9: [2023-04-29 11:26:47,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +28: [2023-04-29 11:26:47,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +23: [2023-04-29 11:26:47,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +20: [2023-04-29 11:26:47,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +34: [2023-04-29 11:26:47,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +34: [2023-04-29 11:26:47,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +27: [2023-04-29 11:26:47,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +34: [2023-04-29 11:26:47,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +34: [2023-04-29 11:26:47,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +20: [2023-04-29 11:26:47,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +28: [2023-04-29 11:26:47,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +26: [2023-04-29 11:26:47,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +23: [2023-04-29 11:26:47,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +30: [2023-04-29 11:26:47,699] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +13: [2023-04-29 11:26:47,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +13: [2023-04-29 11:26:47,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +17: [2023-04-29 11:26:47,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +27: [2023-04-29 11:26:47,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +27: [2023-04-29 11:26:47,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +26: [2023-04-29 11:26:47,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +27: [2023-04-29 11:26:47,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +26: [2023-04-29 11:26:47,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +53: [2023-04-29 11:26:47,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +16: [2023-04-29 11:26:47,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +16: [2023-04-29 11:26:47,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +16: [2023-04-29 11:26:47,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +17: [2023-04-29 11:26:47,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +16: [2023-04-29 11:26:47,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +26: [2023-04-29 11:26:47,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +20: [2023-04-29 11:26:47,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 8: [2023-04-29 11:26:47,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +23: [2023-04-29 11:26:47,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 8: [2023-04-29 11:26:47,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +17: [2023-04-29 11:26:47,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +57: [2023-04-29 11:26:47,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +57: [2023-04-29 11:26:47,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +57: [2023-04-29 11:26:47,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +57: [2023-04-29 11:26:47,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +13: [2023-04-29 11:26:47,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +13: [2023-04-29 11:26:47,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 9: [2023-04-29 11:26:47,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +31: [2023-04-29 11:26:47,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +31: [2023-04-29 11:26:47,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +20: [2023-04-29 11:26:47,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +17: [2023-04-29 11:26:47,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +31: [2023-04-29 11:26:47,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +31: [2023-04-29 11:26:47,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +11: [2023-04-29 11:26:47,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +11: [2023-04-29 11:26:47,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +11: [2023-04-29 11:26:47,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 4: [2023-04-29 11:26:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +53: [2023-04-29 11:26:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +53: [2023-04-29 11:26:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 11:26:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 11:26:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 11:26:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +50: [2023-04-29 11:26:47,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +44: [2023-04-29 11:26:47,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +57: [2023-04-29 11:26:47,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 11:26:47,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +44: [2023-04-29 11:26:47,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +44: [2023-04-29 11:26:47,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +26: [2023-04-29 11:26:47,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +26: [2023-04-29 11:26:47,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +26: [2023-04-29 11:26:47,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +57: [2023-04-29 11:26:47,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +57: [2023-04-29 11:26:47,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +57: [2023-04-29 11:26:47,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +32: [2023-04-29 11:26:47,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +32: [2023-04-29 11:26:47,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +32: [2023-04-29 11:26:47,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +32: [2023-04-29 11:26:47,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 9: [2023-04-29 11:26:47,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 4: [2023-04-29 11:26:47,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +58: [2023-04-29 11:26:47,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +58: [2023-04-29 11:26:47,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +44: [2023-04-29 11:26:47,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 11:26:47,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 11:26:47,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +58: [2023-04-29 11:26:47,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +58: [2023-04-29 11:26:47,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 9: [2023-04-29 11:26:47,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 9: [2023-04-29 11:26:47,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +44: [2023-04-29 11:26:47,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +50: [2023-04-29 11:26:47,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +26: [2023-04-29 11:26:47,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +50: [2023-04-29 11:26:47,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +50: [2023-04-29 11:26:47,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +53: [2023-04-29 11:26:47,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +26: [2023-04-29 11:26:47,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +50: [2023-04-29 11:26:47,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +20: [2023-04-29 11:26:47,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +13: [2023-04-29 11:26:47,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +20: [2023-04-29 11:26:47,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +14: [2023-04-29 11:26:47,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +17: [2023-04-29 11:26:47,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +26: [2023-04-29 11:26:47,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +13: [2023-04-29 11:26:47,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +26: [2023-04-29 11:26:47,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +17: [2023-04-29 11:26:47,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +14: [2023-04-29 11:26:47,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +53: [2023-04-29 11:26:47,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +16: [2023-04-29 11:26:47,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +14: [2023-04-29 11:26:47,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +10: [2023-04-29 11:26:47,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +10: [2023-04-29 11:26:47,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +10: [2023-04-29 11:26:47,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +10: [2023-04-29 11:26:47,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 8: [2023-04-29 11:26:47,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +17: [2023-04-29 11:26:47,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +17: [2023-04-29 11:26:47,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +17: [2023-04-29 11:26:47,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +17: [2023-04-29 11:26:47,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 8: [2023-04-29 11:26:47,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 8: [2023-04-29 11:26:47,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +17: [2023-04-29 11:26:47,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +16: [2023-04-29 11:26:47,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +16: [2023-04-29 11:26:47,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +14: [2023-04-29 11:26:47,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +13: [2023-04-29 11:26:47,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +13: [2023-04-29 11:26:47,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +10: [2023-04-29 11:26:47,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +19: [2023-04-29 11:26:47,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +19: [2023-04-29 11:26:47,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +19: [2023-04-29 11:26:47,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +19: [2023-04-29 11:26:47,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +10: [2023-04-29 11:26:47,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +16: [2023-04-29 11:26:47,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +26: [2023-04-29 11:26:47,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +26: [2023-04-29 11:26:47,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +10: [2023-04-29 11:26:47,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +59: [2023-04-29 11:26:47,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +59: [2023-04-29 11:26:47,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +59: [2023-04-29 11:26:47,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +19: [2023-04-29 11:26:47,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +10: [2023-04-29 11:26:47,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +59: [2023-04-29 11:26:47,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +17: [2023-04-29 11:26:47,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +29: [2023-04-29 11:26:47,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +29: [2023-04-29 11:26:47,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +29: [2023-04-29 11:26:47,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +29: [2023-04-29 11:26:47,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +30: [2023-04-29 11:26:47,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +53: [2023-04-29 11:26:47,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +53: [2023-04-29 11:26:47,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +19: [2023-04-29 11:26:47,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +19: [2023-04-29 11:26:47,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +19: [2023-04-29 11:26:47,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 7: [2023-04-29 11:26:47,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 7: [2023-04-29 11:26:47,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +34: [2023-04-29 11:26:47,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +34: [2023-04-29 11:26:47,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. + 7: [2023-04-29 11:26:47,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +16: [2023-04-29 11:26:47,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +34: [2023-04-29 11:26:47,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +16: [2023-04-29 11:26:47,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +34: [2023-04-29 11:26:47,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +16: [2023-04-29 11:26:47,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +16: [2023-04-29 11:26:47,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +34: [2023-04-29 11:26:47,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +63: [2023-04-29 11:26:47,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +30: [2023-04-29 11:26:47,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +16: [2023-04-29 11:26:47,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +38: [2023-04-29 11:26:47,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +38: [2023-04-29 11:26:47,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +36: [2023-04-29 11:26:47,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +36: [2023-04-29 11:26:47,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +59: [2023-04-29 11:26:47,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +38: [2023-04-29 11:26:47,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 7: [2023-04-29 11:26:47,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +38: [2023-04-29 11:26:47,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +59: [2023-04-29 11:26:47,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +32: [2023-04-29 11:26:47,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +59: [2023-04-29 11:26:47,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +48: [2023-04-29 11:26:47,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +48: [2023-04-29 11:26:47,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +32: [2023-04-29 11:26:47,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +48: [2023-04-29 11:26:47,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +48: [2023-04-29 11:26:47,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +30: [2023-04-29 11:26:47,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +36: [2023-04-29 11:26:47,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +16: [2023-04-29 11:26:47,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +59: [2023-04-29 11:26:47,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +53: [2023-04-29 11:26:47,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +16: [2023-04-29 11:26:47,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +32: [2023-04-29 11:26:47,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +32: [2023-04-29 11:26:47,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +38: [2023-04-29 11:26:47,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +16: [2023-04-29 11:26:47,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +38: [2023-04-29 11:26:47,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +38: [2023-04-29 11:26:47,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +38: [2023-04-29 11:26:47,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +26: [2023-04-29 11:26:47,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +34: [2023-04-29 11:26:47,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +26: [2023-04-29 11:26:47,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +14: [2023-04-29 11:26:47,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +30: [2023-04-29 11:26:47,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 2: [2023-04-29 11:26:47,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +63: [2023-04-29 11:26:47,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +63: [2023-04-29 11:26:47,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +14: [2023-04-29 11:26:47,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +30: [2023-04-29 11:26:47,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +39: [2023-04-29 11:26:47,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +39: [2023-04-29 11:26:47,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 2: [2023-04-29 11:26:47,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +63: [2023-04-29 11:26:47,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +39: [2023-04-29 11:26:47,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +39: [2023-04-29 11:26:47,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 2: [2023-04-29 11:26:47,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +31: [2023-04-29 11:26:47,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +31: [2023-04-29 11:26:47,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +31: [2023-04-29 11:26:47,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +31: [2023-04-29 11:26:47,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +35: [2023-04-29 11:26:47,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +35: [2023-04-29 11:26:47,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +17: [2023-04-29 11:26:47,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +14: [2023-04-29 11:26:47,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +55: [2023-04-29 11:26:47,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +55: [2023-04-29 11:26:47,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +17: [2023-04-29 11:26:47,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +55: [2023-04-29 11:26:47,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +30: [2023-04-29 11:26:47,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +55: [2023-04-29 11:26:47,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +39: [2023-04-29 11:26:47,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +35: [2023-04-29 11:26:47,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +17: [2023-04-29 11:26:47,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +35: [2023-04-29 11:26:47,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +57: [2023-04-29 11:26:47,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +39: [2023-04-29 11:26:47,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +39: [2023-04-29 11:26:47,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +39: [2023-04-29 11:26:47,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 11:26:47,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +37: [2023-04-29 11:26:47,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +37: [2023-04-29 11:26:47,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 3: [2023-04-29 11:26:47,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +37: [2023-04-29 11:26:47,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 11:26:47,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +36: [2023-04-29 11:26:47,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +26: [2023-04-29 11:26:47,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +55: [2023-04-29 11:26:47,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +30: [2023-04-29 11:26:47,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +55: [2023-04-29 11:26:47,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +35: [2023-04-29 11:26:47,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +35: [2023-04-29 11:26:47,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +17: [2023-04-29 11:26:47,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +55: [2023-04-29 11:26:47,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +14: [2023-04-29 11:26:47,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +29: [2023-04-29 11:26:47,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +35: [2023-04-29 11:26:47,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +63: [2023-04-29 11:26:47,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +29: [2023-04-29 11:26:47,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +29: [2023-04-29 11:26:47,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +29: [2023-04-29 11:26:47,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +37: [2023-04-29 11:26:47,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +37: [2023-04-29 11:26:47,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +37: [2023-04-29 11:26:47,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +30: [2023-04-29 11:26:47,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +35: [2023-04-29 11:26:47,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +37: [2023-04-29 11:26:47,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +46: [2023-04-29 11:26:47,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +46: [2023-04-29 11:26:47,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +47: [2023-04-29 11:26:47,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +47: [2023-04-29 11:26:47,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +34: [2023-04-29 11:26:47,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +48: [2023-04-29 11:26:47,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 4: [2023-04-29 11:26:47,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +22: [2023-04-29 11:26:47,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +22: [2023-04-29 11:26:47,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +36: [2023-04-29 11:26:47,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +34: [2023-04-29 11:26:47,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 6: [2023-04-29 11:26:47,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +22: [2023-04-29 11:26:47,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +46: [2023-04-29 11:26:47,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +48: [2023-04-29 11:26:47,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +48: [2023-04-29 11:26:47,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +46: [2023-04-29 11:26:47,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +22: [2023-04-29 11:26:47,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +47: [2023-04-29 11:26:47,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +48: [2023-04-29 11:26:47,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 11:26:47,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +56: [2023-04-29 11:26:47,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +47: [2023-04-29 11:26:47,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +44: [2023-04-29 11:26:47,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +36: [2023-04-29 11:26:47,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +36: [2023-04-29 11:26:47,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 4: [2023-04-29 11:26:47,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +34: [2023-04-29 11:26:47,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 6: [2023-04-29 11:26:47,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +47: [2023-04-29 11:26:47,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +46: [2023-04-29 11:26:47,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 11:26:47,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +34: [2023-04-29 11:26:47,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +56: [2023-04-29 11:26:47,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +46: [2023-04-29 11:26:47,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +21: [2023-04-29 11:26:47,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +21: [2023-04-29 11:26:47,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +57: [2023-04-29 11:26:47,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 6: [2023-04-29 11:26:47,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 6: [2023-04-29 11:26:47,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +46: [2023-04-29 11:26:47,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +46: [2023-04-29 11:26:47,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 2: [2023-04-29 11:26:47,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 2: [2023-04-29 11:26:47,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +47: [2023-04-29 11:26:47,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +47: [2023-04-29 11:26:47,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 11:26:47,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 11:26:47,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +34: [2023-04-29 11:26:47,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +34: [2023-04-29 11:26:47,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 2: [2023-04-29 11:26:47,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +57: [2023-04-29 11:26:47,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +57: [2023-04-29 11:26:47,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 2: [2023-04-29 11:26:47,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +56: [2023-04-29 11:26:47,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 11:26:47,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +21: [2023-04-29 11:26:47,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 4: [2023-04-29 11:26:47,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +21: [2023-04-29 11:26:47,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 5: [2023-04-29 11:26:47,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 6: [2023-04-29 11:26:47,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +47: [2023-04-29 11:26:47,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +63: [2023-04-29 11:26:47,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +44: [2023-04-29 11:26:47,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +44: [2023-04-29 11:26:47,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +52: [2023-04-29 11:26:47,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +52: [2023-04-29 11:26:47,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +34: [2023-04-29 11:26:47,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +34: [2023-04-29 11:26:47,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +56: [2023-04-29 11:26:47,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +49: [2023-04-29 11:26:47,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +49: [2023-04-29 11:26:47,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 11:26:47,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +63: [2023-04-29 11:26:47,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +52: [2023-04-29 11:26:47,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +63: [2023-04-29 11:26:47,792] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +61: [2023-04-29 11:26:47,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +61: [2023-04-29 11:26:47,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +61: [2023-04-29 11:26:47,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +61: [2023-04-29 11:26:47,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +52: [2023-04-29 11:26:47,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +49: [2023-04-29 11:26:47,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 11:26:47,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +60: [2023-04-29 11:26:47,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +60: [2023-04-29 11:26:47,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +49: [2023-04-29 11:26:47,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 11:26:47,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +31: [2023-04-29 11:26:47,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +31: [2023-04-29 11:26:47,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +31: [2023-04-29 11:26:47,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +57: [2023-04-29 11:26:47,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 4: [2023-04-29 11:26:47,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +52: [2023-04-29 11:26:47,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 4: [2023-04-29 11:26:47,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 4: [2023-04-29 11:26:47,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +52: [2023-04-29 11:26:47,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +31: [2023-04-29 11:26:47,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +52: [2023-04-29 11:26:47,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +50: [2023-04-29 11:26:47,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +52: [2023-04-29 11:26:47,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +49: [2023-04-29 11:26:47,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +50: [2023-04-29 11:26:47,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +49: [2023-04-29 11:26:47,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +19: [2023-04-29 11:26:47,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +49: [2023-04-29 11:26:47,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +10: [2023-04-29 11:26:47,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +36: [2023-04-29 11:26:47,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +49: [2023-04-29 11:26:47,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +50: [2023-04-29 11:26:47,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +16: [2023-04-29 11:26:47,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +10: [2023-04-29 11:26:47,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +42: [2023-04-29 11:26:47,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +42: [2023-04-29 11:26:47,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +42: [2023-04-29 11:26:47,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +42: [2023-04-29 11:26:47,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +22: [2023-04-29 11:26:47,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +54: [2023-04-29 11:26:47,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +54: [2023-04-29 11:26:47,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +54: [2023-04-29 11:26:47,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +54: [2023-04-29 11:26:47,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +38: [2023-04-29 11:26:47,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +44: [2023-04-29 11:26:47,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +10: [2023-04-29 11:26:47,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +16: [2023-04-29 11:26:47,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +42: [2023-04-29 11:26:47,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +42: [2023-04-29 11:26:47,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +22: [2023-04-29 11:26:47,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +53: [2023-04-29 11:26:47,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +53: [2023-04-29 11:26:47,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +53: [2023-04-29 11:26:47,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +42: [2023-04-29 11:26:47,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +53: [2023-04-29 11:26:47,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +57: [2023-04-29 11:26:47,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +28: [2023-04-29 11:26:47,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +28: [2023-04-29 11:26:47,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +16: [2023-04-29 11:26:47,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 7: [2023-04-29 11:26:47,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +42: [2023-04-29 11:26:47,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +10: [2023-04-29 11:26:47,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +28: [2023-04-29 11:26:47,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +22: [2023-04-29 11:26:47,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +28: [2023-04-29 11:26:47,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +19: [2023-04-29 11:26:47,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +19: [2023-04-29 11:26:47,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +19: [2023-04-29 11:26:47,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +21: [2023-04-29 11:26:47,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +16: [2023-04-29 11:26:47,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +16: [2023-04-29 11:26:47,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +61: [2023-04-29 11:26:47,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 11:26:47,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +44: [2023-04-29 11:26:47,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +60: [2023-04-29 11:26:47,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +22: [2023-04-29 11:26:47,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +21: [2023-04-29 11:26:47,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +21: [2023-04-29 11:26:47,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +57: [2023-04-29 11:26:47,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +60: [2023-04-29 11:26:47,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +60: [2023-04-29 11:26:47,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +57: [2023-04-29 11:26:47,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +61: [2023-04-29 11:26:47,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +21: [2023-04-29 11:26:47,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +60: [2023-04-29 11:26:47,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +16: [2023-04-29 11:26:47,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +38: [2023-04-29 11:26:47,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +19: [2023-04-29 11:26:47,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +61: [2023-04-29 11:26:47,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 2: [2023-04-29 11:26:47,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +50: [2023-04-29 11:26:47,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +61: [2023-04-29 11:26:47,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +16: [2023-04-29 11:26:47,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +10: [2023-04-29 11:26:47,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +37: [2023-04-29 11:26:47,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +37: [2023-04-29 11:26:47,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +37: [2023-04-29 11:26:47,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +37: [2023-04-29 11:26:47,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +16: [2023-04-29 11:26:47,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +34: [2023-04-29 11:26:47,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +34: [2023-04-29 11:26:47,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +44: [2023-04-29 11:26:47,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +29: [2023-04-29 11:26:47,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +17: [2023-04-29 11:26:47,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +59: [2023-04-29 11:26:47,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +59: [2023-04-29 11:26:47,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +59: [2023-04-29 11:26:47,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +38: [2023-04-29 11:26:47,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +38: [2023-04-29 11:26:47,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +11: [2023-04-29 11:26:47,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +11: [2023-04-29 11:26:47,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +39: [2023-04-29 11:26:47,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 7: [2023-04-29 11:26:47,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 7: [2023-04-29 11:26:47,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +16: [2023-04-29 11:26:47,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +17: [2023-04-29 11:26:47,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +16: [2023-04-29 11:26:47,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +10: [2023-04-29 11:26:47,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +16: [2023-04-29 11:26:47,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +17: [2023-04-29 11:26:47,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +29: [2023-04-29 11:26:47,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 7: [2023-04-29 11:26:47,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +16: [2023-04-29 11:26:47,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +50: [2023-04-29 11:26:47,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +17: [2023-04-29 11:26:47,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +54: [2023-04-29 11:26:47,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +39: [2023-04-29 11:26:47,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +50: [2023-04-29 11:26:47,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +59: [2023-04-29 11:26:47,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 11:26:47,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +16: [2023-04-29 11:26:47,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +54: [2023-04-29 11:26:47,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +38: [2023-04-29 11:26:47,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +11: [2023-04-29 11:26:47,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +11: [2023-04-29 11:26:47,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +48: [2023-04-29 11:26:47,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +39: [2023-04-29 11:26:47,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +39: [2023-04-29 11:26:47,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +54: [2023-04-29 11:26:47,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +55: [2023-04-29 11:26:47,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +53: [2023-04-29 11:26:47,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +53: [2023-04-29 11:26:47,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +54: [2023-04-29 11:26:47,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +35: [2023-04-29 11:26:47,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +35: [2023-04-29 11:26:47,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +35: [2023-04-29 11:26:47,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 7: [2023-04-29 11:26:47,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +10: [2023-04-29 11:26:47,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +53: [2023-04-29 11:26:47,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +43: [2023-04-29 11:26:47,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +43: [2023-04-29 11:26:47,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +29: [2023-04-29 11:26:47,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +29: [2023-04-29 11:26:47,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +55: [2023-04-29 11:26:47,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +53: [2023-04-29 11:26:47,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +48: [2023-04-29 11:26:47,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +17: [2023-04-29 11:26:47,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +17: [2023-04-29 11:26:47,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +28: [2023-04-29 11:26:47,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +48: [2023-04-29 11:26:47,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +28: [2023-04-29 11:26:47,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +28: [2023-04-29 11:26:47,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +41: [2023-04-29 11:26:47,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +41: [2023-04-29 11:26:47,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +41: [2023-04-29 11:26:47,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +43: [2023-04-29 11:26:47,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +43: [2023-04-29 11:26:47,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +47: [2023-04-29 11:26:47,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +36: [2023-04-29 11:26:47,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +36: [2023-04-29 11:26:47,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +36: [2023-04-29 11:26:47,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +55: [2023-04-29 11:26:47,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +55: [2023-04-29 11:26:47,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +41: [2023-04-29 11:26:47,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +37: [2023-04-29 11:26:47,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +37: [2023-04-29 11:26:47,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +36: [2023-04-29 11:26:47,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +29: [2023-04-29 11:26:47,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +19: [2023-04-29 11:26:47,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +19: [2023-04-29 11:26:47,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +28: [2023-04-29 11:26:47,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +43: [2023-04-29 11:26:47,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +43: [2023-04-29 11:26:47,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +35: [2023-04-29 11:26:47,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +17: [2023-04-29 11:26:47,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +52: [2023-04-29 11:26:47,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +17: [2023-04-29 11:26:47,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +19: [2023-04-29 11:26:47,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +38: [2023-04-29 11:26:47,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +48: [2023-04-29 11:26:47,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +48: [2023-04-29 11:26:47,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +29: [2023-04-29 11:26:47,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +10: [2023-04-29 11:26:47,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +46: [2023-04-29 11:26:47,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +46: [2023-04-29 11:26:47,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +43: [2023-04-29 11:26:47,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +41: [2023-04-29 11:26:47,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +29: [2023-04-29 11:26:47,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +60: [2023-04-29 11:26:47,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +60: [2023-04-29 11:26:47,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +41: [2023-04-29 11:26:47,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +41: [2023-04-29 11:26:47,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +43: [2023-04-29 11:26:47,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +48: [2023-04-29 11:26:47,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +31: [2023-04-29 11:26:47,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +41: [2023-04-29 11:26:47,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +47: [2023-04-29 11:26:47,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +27: [2023-04-29 11:26:47,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +27: [2023-04-29 11:26:47,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +11: [2023-04-29 11:26:47,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +27: [2023-04-29 11:26:47,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +56: [2023-04-29 11:26:47,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +56: [2023-04-29 11:26:47,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 11:26:47,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +62: [2023-04-29 11:26:47,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +27: [2023-04-29 11:26:47,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +29: [2023-04-29 11:26:47,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +39: [2023-04-29 11:26:47,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +51: [2023-04-29 11:26:47,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +51: [2023-04-29 11:26:47,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +48: [2023-04-29 11:26:47,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +56: [2023-04-29 11:26:47,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 11:26:47,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +60: [2023-04-29 11:26:47,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +46: [2023-04-29 11:26:47,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +46: [2023-04-29 11:26:47,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +34: [2023-04-29 11:26:47,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 11:26:47,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +31: [2023-04-29 11:26:47,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +62: [2023-04-29 11:26:47,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +59: [2023-04-29 11:26:47,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +34: [2023-04-29 11:26:47,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 11:26:47,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +48: [2023-04-29 11:26:47,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +37: [2023-04-29 11:26:47,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +43: [2023-04-29 11:26:47,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +43: [2023-04-29 11:26:47,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +43: [2023-04-29 11:26:47,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +43: [2023-04-29 11:26:47,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. + 3: [2023-04-29 11:26:47,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +51: [2023-04-29 11:26:47,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +60: [2023-04-29 11:26:47,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +38: [2023-04-29 11:26:47,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +38: [2023-04-29 11:26:47,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +51: [2023-04-29 11:26:47,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +51: [2023-04-29 11:26:47,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +56: [2023-04-29 11:26:47,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +49: [2023-04-29 11:26:47,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +59: [2023-04-29 11:26:47,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +31: [2023-04-29 11:26:47,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +59: [2023-04-29 11:26:47,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 4: [2023-04-29 11:26:47,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +55: [2023-04-29 11:26:47,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +37: [2023-04-29 11:26:47,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +51: [2023-04-29 11:26:47,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +60: [2023-04-29 11:26:47,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +16: [2023-04-29 11:26:47,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +16: [2023-04-29 11:26:47,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +34: [2023-04-29 11:26:47,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +34: [2023-04-29 11:26:47,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... + 7: [2023-04-29 11:26:47,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +16: [2023-04-29 11:26:47,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +39: [2023-04-29 11:26:47,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +52: [2023-04-29 11:26:47,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +51: [2023-04-29 11:26:47,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +60: [2023-04-29 11:26:47,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +52: [2023-04-29 11:26:47,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +52: [2023-04-29 11:26:47,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +31: [2023-04-29 11:26:47,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +37: [2023-04-29 11:26:47,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +37: [2023-04-29 11:26:47,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +51: [2023-04-29 11:26:47,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 11:26:47,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +37: [2023-04-29 11:26:47,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +34: [2023-04-29 11:26:47,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +11: [2023-04-29 11:26:47,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +22: [2023-04-29 11:26:47,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +47: [2023-04-29 11:26:47,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +39: [2023-04-29 11:26:47,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 4: [2023-04-29 11:26:47,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +39: [2023-04-29 11:26:47,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 7: [2023-04-29 11:26:47,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 4: [2023-04-29 11:26:47,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +31: [2023-04-29 11:26:47,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +31: [2023-04-29 11:26:47,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +47: [2023-04-29 11:26:47,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +59: [2023-04-29 11:26:47,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +49: [2023-04-29 11:26:47,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +49: [2023-04-29 11:26:47,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +35: [2023-04-29 11:26:47,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +35: [2023-04-29 11:26:47,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +22: [2023-04-29 11:26:47,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +49: [2023-04-29 11:26:47,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 11:26:47,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +35: [2023-04-29 11:26:47,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +36: [2023-04-29 11:26:47,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +36: [2023-04-29 11:26:47,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 3: [2023-04-29 11:26:47,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +34: [2023-04-29 11:26:47,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +11: [2023-04-29 11:26:47,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +11: [2023-04-29 11:26:47,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +36: [2023-04-29 11:26:47,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +36: [2023-04-29 11:26:47,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +55: [2023-04-29 11:26:47,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +31: [2023-04-29 11:26:47,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +31: [2023-04-29 11:26:47,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +42: [2023-04-29 11:26:47,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +52: [2023-04-29 11:26:47,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +47: [2023-04-29 11:26:47,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +30: [2023-04-29 11:26:47,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +30: [2023-04-29 11:26:47,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +30: [2023-04-29 11:26:47,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +34: [2023-04-29 11:26:47,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 3: [2023-04-29 11:26:47,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +47: [2023-04-29 11:26:47,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 11:26:47,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +30: [2023-04-29 11:26:47,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +55: [2023-04-29 11:26:47,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +35: [2023-04-29 11:26:47,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 11:26:47,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +46: [2023-04-29 11:26:47,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +56: [2023-04-29 11:26:47,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +27: [2023-04-29 11:26:47,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +27: [2023-04-29 11:26:47,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +62: [2023-04-29 11:26:47,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +22: [2023-04-29 11:26:47,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +62: [2023-04-29 11:26:47,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +27: [2023-04-29 11:26:47,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +27: [2023-04-29 11:26:47,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +21: [2023-04-29 11:26:47,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +46: [2023-04-29 11:26:47,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +42: [2023-04-29 11:26:47,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +42: [2023-04-29 11:26:47,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 3: [2023-04-29 11:26:47,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +56: [2023-04-29 11:26:47,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +30: [2023-04-29 11:26:47,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +30: [2023-04-29 11:26:47,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +46: [2023-04-29 11:26:47,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +46: [2023-04-29 11:26:47,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +30: [2023-04-29 11:26:47,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +30: [2023-04-29 11:26:47,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +62: [2023-04-29 11:26:47,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +62: [2023-04-29 11:26:47,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +49: [2023-04-29 11:26:47,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +56: [2023-04-29 11:26:47,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +34: [2023-04-29 11:26:47,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +42: [2023-04-29 11:26:47,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +22: [2023-04-29 11:26:47,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +56: [2023-04-29 11:26:47,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +61: [2023-04-29 11:26:47,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +61: [2023-04-29 11:26:47,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 11:26:47,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +60: [2023-04-29 11:26:47,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +43: [2023-04-29 11:26:47,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +21: [2023-04-29 11:26:47,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +43: [2023-04-29 11:26:47,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +43: [2023-04-29 11:26:47,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +43: [2023-04-29 11:26:47,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +51: [2023-04-29 11:26:47,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +51: [2023-04-29 11:26:47,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +52: [2023-04-29 11:26:47,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +51: [2023-04-29 11:26:47,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. + 6: [2023-04-29 11:26:47,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 6: [2023-04-29 11:26:47,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 6: [2023-04-29 11:26:47,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +51: [2023-04-29 11:26:47,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. + 6: [2023-04-29 11:26:47,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +22: [2023-04-29 11:26:47,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +21: [2023-04-29 11:26:47,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +21: [2023-04-29 11:26:47,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +61: [2023-04-29 11:26:47,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +22: [2023-04-29 11:26:47,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +52: [2023-04-29 11:26:47,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +61: [2023-04-29 11:26:47,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +61: [2023-04-29 11:26:47,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +61: [2023-04-29 11:26:47,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +53: [2023-04-29 11:26:47,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +60: [2023-04-29 11:26:47,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +60: [2023-04-29 11:26:47,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +33: [2023-04-29 11:26:47,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +33: [2023-04-29 11:26:47,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +60: [2023-04-29 11:26:47,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +33: [2023-04-29 11:26:47,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. + 6: [2023-04-29 11:26:47,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +33: [2023-04-29 11:26:47,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. + 6: [2023-04-29 11:26:47,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +21: [2023-04-29 11:26:47,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +13: [2023-04-29 11:26:47,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +13: [2023-04-29 11:26:47,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +52: [2023-04-29 11:26:47,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +13: [2023-04-29 11:26:47,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +47: [2023-04-29 11:26:47,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +47: [2023-04-29 11:26:47,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +47: [2023-04-29 11:26:47,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +13: [2023-04-29 11:26:47,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +47: [2023-04-29 11:26:47,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +22: [2023-04-29 11:26:47,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +21: [2023-04-29 11:26:47,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +21: [2023-04-29 11:26:47,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 2: [2023-04-29 11:26:47,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 2: [2023-04-29 11:26:47,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 2: [2023-04-29 11:26:47,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 2: [2023-04-29 11:26:47,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +61: [2023-04-29 11:26:47,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +53: [2023-04-29 11:26:47,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +61: [2023-04-29 11:26:47,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +22: [2023-04-29 11:26:47,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +37: [2023-04-29 11:26:47,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +25: [2023-04-29 11:26:47,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +25: [2023-04-29 11:26:47,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +60: [2023-04-29 11:26:47,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +25: [2023-04-29 11:26:47,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +25: [2023-04-29 11:26:47,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +49: [2023-04-29 11:26:47,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +47: [2023-04-29 11:26:47,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +21: [2023-04-29 11:26:47,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +47: [2023-04-29 11:26:47,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +37: [2023-04-29 11:26:47,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. + 5: [2023-04-29 11:26:47,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +49: [2023-04-29 11:26:47,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +49: [2023-04-29 11:26:47,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +60: [2023-04-29 11:26:47,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +42: [2023-04-29 11:26:47,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +58: [2023-04-29 11:26:47,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +58: [2023-04-29 11:26:47,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +58: [2023-04-29 11:26:47,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +58: [2023-04-29 11:26:47,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +28: [2023-04-29 11:26:47,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 2: [2023-04-29 11:26:47,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 2: [2023-04-29 11:26:47,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 2: [2023-04-29 11:26:47,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 2: [2023-04-29 11:26:47,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +53: [2023-04-29 11:26:47,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +28: [2023-04-29 11:26:47,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +41: [2023-04-29 11:26:47,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +53: [2023-04-29 11:26:47,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +53: [2023-04-29 11:26:47,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +60: [2023-04-29 11:26:47,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +28: [2023-04-29 11:26:47,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +28: [2023-04-29 11:26:47,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +42: [2023-04-29 11:26:47,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +42: [2023-04-29 11:26:47,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +28: [2023-04-29 11:26:47,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +53: [2023-04-29 11:26:47,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +53: [2023-04-29 11:26:47,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +51: [2023-04-29 11:26:47,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +51: [2023-04-29 11:26:47,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +33: [2023-04-29 11:26:47,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +28: [2023-04-29 11:26:47,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +28: [2023-04-29 11:26:47,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +51: [2023-04-29 11:26:47,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +28: [2023-04-29 11:26:47,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +41: [2023-04-29 11:26:47,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +51: [2023-04-29 11:26:47,919] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +43: [2023-04-29 11:26:47,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +43: [2023-04-29 11:26:47,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +20: [2023-04-29 11:26:47,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +20: [2023-04-29 11:26:47,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +20: [2023-04-29 11:26:47,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +20: [2023-04-29 11:26:47,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_14-model_01-model_states.pt. +33: [2023-04-29 11:26:47,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +11: [2023-04-29 11:26:47,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +45: [2023-04-29 11:26:47,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 11:26:47,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +54: [2023-04-29 11:26:47,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +54: [2023-04-29 11:26:47,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 11:26:47,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +54: [2023-04-29 11:26:47,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +42: [2023-04-29 11:26:47,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +45: [2023-04-29 11:26:47,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +54: [2023-04-29 11:26:47,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +54: [2023-04-29 11:26:47,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +54: [2023-04-29 11:26:47,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +53: [2023-04-29 11:26:47,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +54: [2023-04-29 11:26:47,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +41: [2023-04-29 11:26:47,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +54: [2023-04-29 11:26:47,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +33: [2023-04-29 11:26:47,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +41: [2023-04-29 11:26:47,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +36: [2023-04-29 11:26:47,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +47: [2023-04-29 11:26:47,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +33: [2023-04-29 11:26:47,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +47: [2023-04-29 11:26:47,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +47: [2023-04-29 11:26:47,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +13: [2023-04-29 11:26:47,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +25: [2023-04-29 11:26:47,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +11: [2023-04-29 11:26:47,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +54: [2023-04-29 11:26:47,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +47: [2023-04-29 11:26:47,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +51: [2023-04-29 11:26:47,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +25: [2023-04-29 11:26:47,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 4: [2023-04-29 11:26:47,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +45: [2023-04-29 11:26:47,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +54: [2023-04-29 11:26:47,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +45: [2023-04-29 11:26:47,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +13: [2023-04-29 11:26:47,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +54: [2023-04-29 11:26:47,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +54: [2023-04-29 11:26:47,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +46: [2023-04-29 11:26:47,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +46: [2023-04-29 11:26:47,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +46: [2023-04-29 11:26:47,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +36: [2023-04-29 11:26:47,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +46: [2023-04-29 11:26:47,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +54: [2023-04-29 11:26:47,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +13: [2023-04-29 11:26:47,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +45: [2023-04-29 11:26:47,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +25: [2023-04-29 11:26:47,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +25: [2023-04-29 11:26:47,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +60: [2023-04-29 11:26:47,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +13: [2023-04-29 11:26:47,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +40: [2023-04-29 11:26:47,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +40: [2023-04-29 11:26:47,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +37: [2023-04-29 11:26:47,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +45: [2023-04-29 11:26:47,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +43: [2023-04-29 11:26:47,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +54: [2023-04-29 11:26:47,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... + 5: [2023-04-29 11:26:47,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +12: [2023-04-29 11:26:47,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +12: [2023-04-29 11:26:47,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +43: [2023-04-29 11:26:47,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +54: [2023-04-29 11:26:47,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +54: [2023-04-29 11:26:47,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +12: [2023-04-29 11:26:47,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +60: [2023-04-29 11:26:47,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +60: [2023-04-29 11:26:47,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 0: [2023-04-29 11:26:47,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 0: [2023-04-29 11:26:47,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +12: [2023-04-29 11:26:47,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +40: [2023-04-29 11:26:47,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. + 0: [2023-04-29 11:26:47,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +40: [2023-04-29 11:26:47,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. + 4: [2023-04-29 11:26:47,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 5: [2023-04-29 11:26:47,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +41: [2023-04-29 11:26:47,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +58: [2023-04-29 11:26:47,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +58: [2023-04-29 11:26:47,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +58: [2023-04-29 11:26:47,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +58: [2023-04-29 11:26:47,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +36: [2023-04-29 11:26:47,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +62: [2023-04-29 11:26:47,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +12: [2023-04-29 11:26:47,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +62: [2023-04-29 11:26:47,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 0: [2023-04-29 11:26:47,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +62: [2023-04-29 11:26:47,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +62: [2023-04-29 11:26:47,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +36: [2023-04-29 11:26:47,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +12: [2023-04-29 11:26:47,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +12: [2023-04-29 11:26:47,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 0: [2023-04-29 11:26:47,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +12: [2023-04-29 11:26:47,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 4: [2023-04-29 11:26:47,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +36: [2023-04-29 11:26:47,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +37: [2023-04-29 11:26:47,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +51: [2023-04-29 11:26:47,941] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +36: [2023-04-29 11:26:47,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +60: [2023-04-29 11:26:47,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +36: [2023-04-29 11:26:47,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +62: [2023-04-29 11:26:47,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +62: [2023-04-29 11:26:47,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +62: [2023-04-29 11:26:47,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +62: [2023-04-29 11:26:47,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +36: [2023-04-29 11:26:47,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +27: [2023-04-29 11:26:47,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +27: [2023-04-29 11:26:47,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +43: [2023-04-29 11:26:47,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +43: [2023-04-29 11:26:47,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +51: [2023-04-29 11:26:47,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +20: [2023-04-29 11:26:47,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +11: [2023-04-29 11:26:47,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +20: [2023-04-29 11:26:47,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +41: [2023-04-29 11:26:47,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +41: [2023-04-29 11:26:47,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +62: [2023-04-29 11:26:47,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +30: [2023-04-29 11:26:47,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +37: [2023-04-29 11:26:47,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +27: [2023-04-29 11:26:47,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +27: [2023-04-29 11:26:47,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +11: [2023-04-29 11:26:47,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +11: [2023-04-29 11:26:47,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +62: [2023-04-29 11:26:47,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +27: [2023-04-29 11:26:47,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +27: [2023-04-29 11:26:47,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +41: [2023-04-29 11:26:47,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +62: [2023-04-29 11:26:47,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +37: [2023-04-29 11:26:47,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +37: [2023-04-29 11:26:47,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +20: [2023-04-29 11:26:47,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +20: [2023-04-29 11:26:47,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt... +51: [2023-04-29 11:26:47,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +30: [2023-04-29 11:26:47,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +30: [2023-04-29 11:26:47,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +30: [2023-04-29 11:26:47,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +51: [2023-04-29 11:26:47,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +46: [2023-04-29 11:26:47,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 1: [2023-04-29 11:26:47,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +60: [2023-04-29 11:26:47,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +27: [2023-04-29 11:26:47,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +27: [2023-04-29 11:26:47,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 1: [2023-04-29 11:26:47,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +62: [2023-04-29 11:26:47,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +62: [2023-04-29 11:26:47,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +62: [2023-04-29 11:26:47,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... + 1: [2023-04-29 11:26:47,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +46: [2023-04-29 11:26:47,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +62: [2023-04-29 11:26:47,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +11: [2023-04-29 11:26:47,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +46: [2023-04-29 11:26:47,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +46: [2023-04-29 11:26:47,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +40: [2023-04-29 11:26:47,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +11: [2023-04-29 11:26:47,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +40: [2023-04-29 11:26:47,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 11:26:47,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +40: [2023-04-29 11:26:47,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +11: [2023-04-29 11:26:47,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +37: [2023-04-29 11:26:47,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +37: [2023-04-29 11:26:47,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +43: [2023-04-29 11:26:47,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +60: [2023-04-29 11:26:47,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +43: [2023-04-29 11:26:47,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 6: [2023-04-29 11:26:47,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 1: [2023-04-29 11:26:47,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 1: [2023-04-29 11:26:47,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 1: [2023-04-29 11:26:47,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 1: [2023-04-29 11:26:47,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +40: [2023-04-29 11:26:47,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +62: [2023-04-29 11:26:47,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +60: [2023-04-29 11:26:47,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +43: [2023-04-29 11:26:47,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +43: [2023-04-29 11:26:47,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 6: [2023-04-29 11:26:47,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 6: [2023-04-29 11:26:47,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +43: [2023-04-29 11:26:47,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +43: [2023-04-29 11:26:47,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 4: [2023-04-29 11:26:47,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 4: [2023-04-29 11:26:47,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +43: [2023-04-29 11:26:47,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +43: [2023-04-29 11:26:47,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +51: [2023-04-29 11:26:47,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 4: [2023-04-29 11:26:47,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +43: [2023-04-29 11:26:47,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +43: [2023-04-29 11:26:47,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +60: [2023-04-29 11:26:47,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +51: [2023-04-29 11:26:47,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +30: [2023-04-29 11:26:47,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +15: [2023-04-29 11:26:47,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +15: [2023-04-29 11:26:47,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +15: [2023-04-29 11:26:47,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +15: [2023-04-29 11:26:47,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +54: [2023-04-29 11:26:47,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +15: [2023-04-29 11:26:47,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +51: [2023-04-29 11:26:47,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +15: [2023-04-29 11:26:47,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +15: [2023-04-29 11:26:47,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +15: [2023-04-29 11:26:47,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +30: [2023-04-29 11:26:47,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +30: [2023-04-29 11:26:47,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +47: [2023-04-29 11:26:47,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +47: [2023-04-29 11:26:47,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +30: [2023-04-29 11:26:47,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +25: [2023-04-29 11:26:47,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +54: [2023-04-29 11:26:47,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 11:26:47,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 6: [2023-04-29 11:26:47,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 6: [2023-04-29 11:26:47,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +51: [2023-04-29 11:26:47,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +58: [2023-04-29 11:26:47,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +47: [2023-04-29 11:26:47,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +25: [2023-04-29 11:26:47,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +51: [2023-04-29 11:26:47,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +47: [2023-04-29 11:26:47,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +54: [2023-04-29 11:26:47,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +47: [2023-04-29 11:26:47,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +47: [2023-04-29 11:26:47,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +13: [2023-04-29 11:26:47,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +13: [2023-04-29 11:26:47,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +13: [2023-04-29 11:26:47,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 6: [2023-04-29 11:26:47,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 5: [2023-04-29 11:26:47,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +25: [2023-04-29 11:26:47,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +45: [2023-04-29 11:26:47,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +25: [2023-04-29 11:26:47,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +25: [2023-04-29 11:26:47,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +47: [2023-04-29 11:26:47,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... + 6: [2023-04-29 11:26:47,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +58: [2023-04-29 11:26:47,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +45: [2023-04-29 11:26:47,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +51: [2023-04-29 11:26:47,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +51: [2023-04-29 11:26:47,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +47: [2023-04-29 11:26:47,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +45: [2023-04-29 11:26:47,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +12: [2023-04-29 11:26:47,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +12: [2023-04-29 11:26:47,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +51: [2023-04-29 11:26:47,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +13: [2023-04-29 11:26:48,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +25: [2023-04-29 11:26:48,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +13: [2023-04-29 11:26:48,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 0: [2023-04-29 11:26:48,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +25: [2023-04-29 11:26:48,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +51: [2023-04-29 11:26:48,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +13: [2023-04-29 11:26:48,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +13: [2023-04-29 11:26:48,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +58: [2023-04-29 11:26:48,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +58: [2023-04-29 11:26:48,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +12: [2023-04-29 11:26:48,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +12: [2023-04-29 11:26:48,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +23: [2023-04-29 11:26:48,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +23: [2023-04-29 11:26:48,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +62: [2023-04-29 11:26:48,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 0: [2023-04-29 11:26:48,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +25: [2023-04-29 11:26:48,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +51: [2023-04-29 11:26:48,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +13: [2023-04-29 11:26:48,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 5: [2023-04-29 11:26:48,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +54: [2023-04-29 11:26:48,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +23: [2023-04-29 11:26:48,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +51: [2023-04-29 11:26:48,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +23: [2023-04-29 11:26:48,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +58: [2023-04-29 11:26:48,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +58: [2023-04-29 11:26:48,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +23: [2023-04-29 11:26:48,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 0: [2023-04-29 11:26:48,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +23: [2023-04-29 11:26:48,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +20: [2023-04-29 11:26:48,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +54: [2023-04-29 11:26:48,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +58: [2023-04-29 11:26:48,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +23: [2023-04-29 11:26:48,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +23: [2023-04-29 11:26:48,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 5: [2023-04-29 11:26:48,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +62: [2023-04-29 11:26:48,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +62: [2023-04-29 11:26:48,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +54: [2023-04-29 11:26:48,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +45: [2023-04-29 11:26:48,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +20: [2023-04-29 11:26:48,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +62: [2023-04-29 11:26:48,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +20: [2023-04-29 11:26:48,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +54: [2023-04-29 11:26:48,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +58: [2023-04-29 11:26:48,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +46: [2023-04-29 11:26:48,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +48: [2023-04-29 11:26:48,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +48: [2023-04-29 11:26:48,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +48: [2023-04-29 11:26:48,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +45: [2023-04-29 11:26:48,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +48: [2023-04-29 11:26:48,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +20: [2023-04-29 11:26:48,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 1: [2023-04-29 11:26:48,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +20: [2023-04-29 11:26:48,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +33: [2023-04-29 11:26:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +33: [2023-04-29 11:26:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +33: [2023-04-29 11:26:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +33: [2023-04-29 11:26:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +33: [2023-04-29 11:26:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +33: [2023-04-29 11:26:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +33: [2023-04-29 11:26:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +33: [2023-04-29 11:26:48,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +46: [2023-04-29 11:26:48,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +12: [2023-04-29 11:26:48,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +12: [2023-04-29 11:26:48,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +45: [2023-04-29 11:26:48,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +46: [2023-04-29 11:26:48,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +33: [2023-04-29 11:26:48,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +46: [2023-04-29 11:26:48,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 0: [2023-04-29 11:26:48,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +45: [2023-04-29 11:26:48,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +20: [2023-04-29 11:26:48,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_00-model_states.pt. +33: [2023-04-29 11:26:48,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +33: [2023-04-29 11:26:48,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +20: [2023-04-29 11:26:48,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... +62: [2023-04-29 11:26:48,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 1: [2023-04-29 11:26:48,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +46: [2023-04-29 11:26:48,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +33: [2023-04-29 11:26:48,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +33: [2023-04-29 11:26:48,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +33: [2023-04-29 11:26:48,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +46: [2023-04-29 11:26:48,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +33: [2023-04-29 11:26:48,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +33: [2023-04-29 11:26:48,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +54: [2023-04-29 11:26:48,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +20: [2023-04-29 11:26:48,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt... + 0: [2023-04-29 11:26:48,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +12: [2023-04-29 11:26:48,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +12: [2023-04-29 11:26:48,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +46: [2023-04-29 11:26:48,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +46: [2023-04-29 11:26:48,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... + 0: [2023-04-29 11:26:48,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +62: [2023-04-29 11:26:48,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +62: [2023-04-29 11:26:48,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +62: [2023-04-29 11:26:48,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +15: [2023-04-29 11:26:48,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +15: [2023-04-29 11:26:48,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +48: [2023-04-29 11:26:48,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +48: [2023-04-29 11:26:48,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +48: [2023-04-29 11:26:48,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +15: [2023-04-29 11:26:48,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +15: [2023-04-29 11:26:48,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +48: [2023-04-29 11:26:48,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 3: [2023-04-29 11:26:48,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +34: [2023-04-29 11:26:48,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +34: [2023-04-29 11:26:48,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +34: [2023-04-29 11:26:48,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +34: [2023-04-29 11:26:48,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. + 1: [2023-04-29 11:26:48,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +11: [2023-04-29 11:26:48,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +11: [2023-04-29 11:26:48,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +11: [2023-04-29 11:26:48,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +11: [2023-04-29 11:26:48,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 3: [2023-04-29 11:26:48,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 3: [2023-04-29 11:26:48,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 3: [2023-04-29 11:26:48,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +11: [2023-04-29 11:26:48,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 2: [2023-04-29 11:26:48,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 2: [2023-04-29 11:26:48,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 2: [2023-04-29 11:26:48,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 2: [2023-04-29 11:26:48,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +11: [2023-04-29 11:26:48,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +11: [2023-04-29 11:26:48,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +11: [2023-04-29 11:26:48,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +18: [2023-04-29 11:26:48,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +18: [2023-04-29 11:26:48,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +18: [2023-04-29 11:26:48,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +18: [2023-04-29 11:26:48,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 2: [2023-04-29 11:26:48,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 2: [2023-04-29 11:26:48,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 2: [2023-04-29 11:26:48,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +18: [2023-04-29 11:26:48,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +18: [2023-04-29 11:26:48,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 2: [2023-04-29 11:26:48,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +18: [2023-04-29 11:26:48,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +18: [2023-04-29 11:26:48,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +15: [2023-04-29 11:26:48,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +15: [2023-04-29 11:26:48,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +15: [2023-04-29 11:26:48,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +55: [2023-04-29 11:26:48,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +55: [2023-04-29 11:26:48,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +55: [2023-04-29 11:26:48,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +55: [2023-04-29 11:26:48,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +15: [2023-04-29 11:26:48,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +29: [2023-04-29 11:26:48,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +29: [2023-04-29 11:26:48,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +29: [2023-04-29 11:26:48,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +29: [2023-04-29 11:26:48,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +23: [2023-04-29 11:26:48,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +23: [2023-04-29 11:26:48,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +34: [2023-04-29 11:26:48,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +34: [2023-04-29 11:26:48,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +23: [2023-04-29 11:26:48,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +24: [2023-04-29 11:26:48,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +24: [2023-04-29 11:26:48,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +24: [2023-04-29 11:26:48,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +24: [2023-04-29 11:26:48,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +29: [2023-04-29 11:26:48,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +50: [2023-04-29 11:26:48,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +50: [2023-04-29 11:26:48,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +50: [2023-04-29 11:26:48,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +29: [2023-04-29 11:26:48,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +50: [2023-04-29 11:26:48,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +29: [2023-04-29 11:26:48,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +29: [2023-04-29 11:26:48,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +52: [2023-04-29 11:26:48,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +52: [2023-04-29 11:26:48,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +33: [2023-04-29 11:26:48,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +52: [2023-04-29 11:26:48,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +52: [2023-04-29 11:26:48,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +23: [2023-04-29 11:26:48,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +34: [2023-04-29 11:26:48,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +34: [2023-04-29 11:26:48,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +40: [2023-04-29 11:26:48,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +40: [2023-04-29 11:26:48,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +40: [2023-04-29 11:26:48,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +40: [2023-04-29 11:26:48,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +40: [2023-04-29 11:26:48,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +40: [2023-04-29 11:26:48,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +40: [2023-04-29 11:26:48,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +40: [2023-04-29 11:26:48,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +32: [2023-04-29 11:26:48,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +32: [2023-04-29 11:26:48,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +33: [2023-04-29 11:26:48,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +32: [2023-04-29 11:26:48,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +32: [2023-04-29 11:26:48,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +40: [2023-04-29 11:26:48,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +40: [2023-04-29 11:26:48,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +40: [2023-04-29 11:26:48,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +33: [2023-04-29 11:26:48,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +40: [2023-04-29 11:26:48,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +24: [2023-04-29 11:26:48,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +24: [2023-04-29 11:26:48,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +40: [2023-04-29 11:26:48,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +40: [2023-04-29 11:26:48,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +40: [2023-04-29 11:26:48,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +40: [2023-04-29 11:26:48,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +38: [2023-04-29 11:26:48,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +38: [2023-04-29 11:26:48,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +38: [2023-04-29 11:26:48,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +38: [2023-04-29 11:26:48,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +24: [2023-04-29 11:26:48,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +24: [2023-04-29 11:26:48,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +24: [2023-04-29 11:26:48,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +24: [2023-04-29 11:26:48,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +55: [2023-04-29 11:26:48,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +55: [2023-04-29 11:26:48,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +33: [2023-04-29 11:26:48,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +53: [2023-04-29 11:26:48,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +53: [2023-04-29 11:26:48,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +53: [2023-04-29 11:26:48,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +24: [2023-04-29 11:26:48,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +53: [2023-04-29 11:26:48,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +55: [2023-04-29 11:26:48,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +24: [2023-04-29 11:26:48,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +24: [2023-04-29 11:26:48,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +23: [2023-04-29 11:26:48,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 1: [2023-04-29 11:26:48,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 1: [2023-04-29 11:26:48,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 1: [2023-04-29 11:26:48,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 1: [2023-04-29 11:26:48,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +55: [2023-04-29 11:26:48,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +52: [2023-04-29 11:26:48,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +52: [2023-04-29 11:26:48,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +23: [2023-04-29 11:26:48,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +50: [2023-04-29 11:26:48,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +23: [2023-04-29 11:26:48,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +50: [2023-04-29 11:26:48,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +50: [2023-04-29 11:26:48,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +50: [2023-04-29 11:26:48,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +19: [2023-04-29 11:26:48,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +19: [2023-04-29 11:26:48,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +19: [2023-04-29 11:26:48,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +32: [2023-04-29 11:26:48,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +19: [2023-04-29 11:26:48,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +52: [2023-04-29 11:26:48,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +52: [2023-04-29 11:26:48,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +36: [2023-04-29 11:26:48,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +36: [2023-04-29 11:26:48,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +61: [2023-04-29 11:26:48,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +61: [2023-04-29 11:26:48,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +33: [2023-04-29 11:26:48,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +23: [2023-04-29 11:26:48,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +33: [2023-04-29 11:26:48,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +36: [2023-04-29 11:26:48,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +36: [2023-04-29 11:26:48,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +33: [2023-04-29 11:26:48,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +19: [2023-04-29 11:26:48,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +19: [2023-04-29 11:26:48,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +19: [2023-04-29 11:26:48,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +19: [2023-04-29 11:26:48,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +61: [2023-04-29 11:26:48,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +61: [2023-04-29 11:26:48,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +24: [2023-04-29 11:26:48,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +39: [2023-04-29 11:26:48,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 11:26:48,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +24: [2023-04-29 11:26:48,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +39: [2023-04-29 11:26:48,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +25: [2023-04-29 11:26:48,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +25: [2023-04-29 11:26:48,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +39: [2023-04-29 11:26:48,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +25: [2023-04-29 11:26:48,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +25: [2023-04-29 11:26:48,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 2: [2023-04-29 11:26:48,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +32: [2023-04-29 11:26:48,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +24: [2023-04-29 11:26:48,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +44: [2023-04-29 11:26:48,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +44: [2023-04-29 11:26:48,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +38: [2023-04-29 11:26:48,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +44: [2023-04-29 11:26:48,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +44: [2023-04-29 11:26:48,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. + 3: [2023-04-29 11:26:48,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +38: [2023-04-29 11:26:48,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +39: [2023-04-29 11:26:48,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +39: [2023-04-29 11:26:48,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +25: [2023-04-29 11:26:48,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +25: [2023-04-29 11:26:48,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +25: [2023-04-29 11:26:48,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +39: [2023-04-29 11:26:48,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +39: [2023-04-29 11:26:48,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +25: [2023-04-29 11:26:48,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +38: [2023-04-29 11:26:48,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +32: [2023-04-29 11:26:48,130] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +45: [2023-04-29 11:26:48,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +45: [2023-04-29 11:26:48,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +38: [2023-04-29 11:26:48,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +45: [2023-04-29 11:26:48,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +11: [2023-04-29 11:26:48,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +45: [2023-04-29 11:26:48,131] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. + 9: [2023-04-29 11:26:48,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +20: [2023-04-29 11:26:48,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +20: [2023-04-29 11:26:48,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +63: [2023-04-29 11:26:48,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 11:26:48,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 2: [2023-04-29 11:26:48,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +18: [2023-04-29 11:26:48,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +53: [2023-04-29 11:26:48,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +20: [2023-04-29 11:26:48,136] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +20: [2023-04-29 11:26:48,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +63: [2023-04-29 11:26:48,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 11:26:48,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +32: [2023-04-29 11:26:48,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +53: [2023-04-29 11:26:48,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +53: [2023-04-29 11:26:48,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +63: [2023-04-29 11:26:48,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 3: [2023-04-29 11:26:48,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +53: [2023-04-29 11:26:48,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +63: [2023-04-29 11:26:48,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 2: [2023-04-29 11:26:48,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +20: [2023-04-29 11:26:48,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 1: [2023-04-29 11:26:48,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +37: [2023-04-29 11:26:48,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +37: [2023-04-29 11:26:48,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +20: [2023-04-29 11:26:48,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +33: [2023-04-29 11:26:48,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +20: [2023-04-29 11:26:48,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +37: [2023-04-29 11:26:48,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +37: [2023-04-29 11:26:48,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +20: [2023-04-29 11:26:48,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +18: [2023-04-29 11:26:48,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +63: [2023-04-29 11:26:48,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +11: [2023-04-29 11:26:48,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +11: [2023-04-29 11:26:48,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +11: [2023-04-29 11:26:48,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 2: [2023-04-29 11:26:48,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +18: [2023-04-29 11:26:48,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +63: [2023-04-29 11:26:48,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +18: [2023-04-29 11:26:48,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 1: [2023-04-29 11:26:48,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 1: [2023-04-29 11:26:48,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +29: [2023-04-29 11:26:48,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +61: [2023-04-29 11:26:48,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +61: [2023-04-29 11:26:48,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 2: [2023-04-29 11:26:48,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 3: [2023-04-29 11:26:48,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +61: [2023-04-29 11:26:48,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +58: [2023-04-29 11:26:48,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +58: [2023-04-29 11:26:48,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +58: [2023-04-29 11:26:48,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +44: [2023-04-29 11:26:48,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +58: [2023-04-29 11:26:48,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +32: [2023-04-29 11:26:48,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +32: [2023-04-29 11:26:48,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +32: [2023-04-29 11:26:48,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +36: [2023-04-29 11:26:48,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +32: [2023-04-29 11:26:48,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +36: [2023-04-29 11:26:48,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 3: [2023-04-29 11:26:48,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +61: [2023-04-29 11:26:48,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +27: [2023-04-29 11:26:48,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +27: [2023-04-29 11:26:48,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +27: [2023-04-29 11:26:48,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +44: [2023-04-29 11:26:48,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +27: [2023-04-29 11:26:48,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +29: [2023-04-29 11:26:48,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +44: [2023-04-29 11:26:48,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +11: [2023-04-29 11:26:48,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +36: [2023-04-29 11:26:48,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +36: [2023-04-29 11:26:48,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +28: [2023-04-29 11:26:48,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +28: [2023-04-29 11:26:48,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +28: [2023-04-29 11:26:48,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +28: [2023-04-29 11:26:48,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 2: [2023-04-29 11:26:48,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +26: [2023-04-29 11:26:48,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +26: [2023-04-29 11:26:48,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +58: [2023-04-29 11:26:48,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +58: [2023-04-29 11:26:48,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +44: [2023-04-29 11:26:48,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +18: [2023-04-29 11:26:48,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +58: [2023-04-29 11:26:48,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +58: [2023-04-29 11:26:48,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +40: [2023-04-29 11:26:48,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 11:26:48,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +27: [2023-04-29 11:26:48,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +27: [2023-04-29 11:26:48,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +45: [2023-04-29 11:26:48,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +31: [2023-04-29 11:26:48,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +14: [2023-04-29 11:26:48,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +14: [2023-04-29 11:26:48,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +27: [2023-04-29 11:26:48,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +48: [2023-04-29 11:26:48,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +48: [2023-04-29 11:26:48,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +31: [2023-04-29 11:26:48,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +31: [2023-04-29 11:26:48,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +29: [2023-04-29 11:26:48,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +26: [2023-04-29 11:26:48,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +27: [2023-04-29 11:26:48,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +31: [2023-04-29 11:26:48,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +28: [2023-04-29 11:26:48,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +45: [2023-04-29 11:26:48,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +26: [2023-04-29 11:26:48,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +28: [2023-04-29 11:26:48,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +48: [2023-04-29 11:26:48,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +48: [2023-04-29 11:26:48,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +48: [2023-04-29 11:26:48,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +48: [2023-04-29 11:26:48,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +48: [2023-04-29 11:26:48,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +48: [2023-04-29 11:26:48,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +32: [2023-04-29 11:26:48,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +32: [2023-04-29 11:26:48,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +32: [2023-04-29 11:26:48,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +26: [2023-04-29 11:26:48,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +38: [2023-04-29 11:26:48,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 11:26:48,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +28: [2023-04-29 11:26:48,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +32: [2023-04-29 11:26:48,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +14: [2023-04-29 11:26:48,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +38: [2023-04-29 11:26:48,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +14: [2023-04-29 11:26:48,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 7: [2023-04-29 11:26:48,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 7: [2023-04-29 11:26:48,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +28: [2023-04-29 11:26:48,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +26: [2023-04-29 11:26:48,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 7: [2023-04-29 11:26:48,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +29: [2023-04-29 11:26:48,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 7: [2023-04-29 11:26:48,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +31: [2023-04-29 11:26:48,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +31: [2023-04-29 11:26:48,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 8: [2023-04-29 11:26:48,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +26: [2023-04-29 11:26:48,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +26: [2023-04-29 11:26:48,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +48: [2023-04-29 11:26:48,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... + 8: [2023-04-29 11:26:48,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +41: [2023-04-29 11:26:48,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +41: [2023-04-29 11:26:48,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +41: [2023-04-29 11:26:48,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +41: [2023-04-29 11:26:48,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +48: [2023-04-29 11:26:48,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +31: [2023-04-29 11:26:48,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +48: [2023-04-29 11:26:48,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 2: [2023-04-29 11:26:48,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +38: [2023-04-29 11:26:48,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +48: [2023-04-29 11:26:48,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +31: [2023-04-29 11:26:48,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +48: [2023-04-29 11:26:48,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +40: [2023-04-29 11:26:48,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +48: [2023-04-29 11:26:48,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +24: [2023-04-29 11:26:48,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +24: [2023-04-29 11:26:48,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +48: [2023-04-29 11:26:48,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... + 3: [2023-04-29 11:26:48,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 7: [2023-04-29 11:26:48,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 7: [2023-04-29 11:26:48,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +48: [2023-04-29 11:26:48,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +38: [2023-04-29 11:26:48,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 7: [2023-04-29 11:26:48,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +52: [2023-04-29 11:26:48,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 11:26:48,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +18: [2023-04-29 11:26:48,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +50: [2023-04-29 11:26:48,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +50: [2023-04-29 11:26:48,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +37: [2023-04-29 11:26:48,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +50: [2023-04-29 11:26:48,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +38: [2023-04-29 11:26:48,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +38: [2023-04-29 11:26:48,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +40: [2023-04-29 11:26:48,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 8: [2023-04-29 11:26:48,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 8: [2023-04-29 11:26:48,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +29: [2023-04-29 11:26:48,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +18: [2023-04-29 11:26:48,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +18: [2023-04-29 11:26:48,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +24: [2023-04-29 11:26:48,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 2: [2023-04-29 11:26:48,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 7: [2023-04-29 11:26:48,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +52: [2023-04-29 11:26:48,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 11:26:48,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +34: [2023-04-29 11:26:48,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +34: [2023-04-29 11:26:48,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +34: [2023-04-29 11:26:48,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +34: [2023-04-29 11:26:48,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +34: [2023-04-29 11:26:48,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +34: [2023-04-29 11:26:48,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +34: [2023-04-29 11:26:48,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +37: [2023-04-29 11:26:48,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +40: [2023-04-29 11:26:48,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +34: [2023-04-29 11:26:48,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +52: [2023-04-29 11:26:48,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +53: [2023-04-29 11:26:48,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +53: [2023-04-29 11:26:48,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +11: [2023-04-29 11:26:48,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +11: [2023-04-29 11:26:48,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +53: [2023-04-29 11:26:48,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +53: [2023-04-29 11:26:48,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +11: [2023-04-29 11:26:48,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +21: [2023-04-29 11:26:48,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 11:26:48,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 11:26:48,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +37: [2023-04-29 11:26:48,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 11:26:48,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +24: [2023-04-29 11:26:48,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +52: [2023-04-29 11:26:48,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +38: [2023-04-29 11:26:48,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +21: [2023-04-29 11:26:48,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +38: [2023-04-29 11:26:48,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +50: [2023-04-29 11:26:48,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +50: [2023-04-29 11:26:48,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +61: [2023-04-29 11:26:48,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +61: [2023-04-29 11:26:48,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +61: [2023-04-29 11:26:48,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +61: [2023-04-29 11:26:48,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +52: [2023-04-29 11:26:48,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 11:26:48,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +55: [2023-04-29 11:26:48,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +55: [2023-04-29 11:26:48,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +29: [2023-04-29 11:26:48,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +55: [2023-04-29 11:26:48,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +50: [2023-04-29 11:26:48,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +40: [2023-04-29 11:26:48,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +34: [2023-04-29 11:26:48,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +25: [2023-04-29 11:26:48,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +50: [2023-04-29 11:26:48,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +34: [2023-04-29 11:26:48,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +55: [2023-04-29 11:26:48,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +34: [2023-04-29 11:26:48,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +53: [2023-04-29 11:26:48,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +53: [2023-04-29 11:26:48,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +32: [2023-04-29 11:26:48,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +19: [2023-04-29 11:26:48,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +53: [2023-04-29 11:26:48,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +21: [2023-04-29 11:26:48,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +53: [2023-04-29 11:26:48,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +21: [2023-04-29 11:26:48,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +21: [2023-04-29 11:26:48,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +17: [2023-04-29 11:26:48,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +17: [2023-04-29 11:26:48,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +21: [2023-04-29 11:26:48,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +55: [2023-04-29 11:26:48,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +10: [2023-04-29 11:26:48,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +17: [2023-04-29 11:26:48,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +10: [2023-04-29 11:26:48,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +10: [2023-04-29 11:26:48,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +17: [2023-04-29 11:26:48,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +10: [2023-04-29 11:26:48,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +52: [2023-04-29 11:26:48,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +52: [2023-04-29 11:26:48,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +50: [2023-04-29 11:26:48,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 11:26:48,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +61: [2023-04-29 11:26:48,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +61: [2023-04-29 11:26:48,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +55: [2023-04-29 11:26:48,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +55: [2023-04-29 11:26:48,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +61: [2023-04-29 11:26:48,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +61: [2023-04-29 11:26:48,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +34: [2023-04-29 11:26:48,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +19: [2023-04-29 11:26:48,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +55: [2023-04-29 11:26:48,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 11:26:48,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +32: [2023-04-29 11:26:48,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +34: [2023-04-29 11:26:48,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +34: [2023-04-29 11:26:48,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +34: [2023-04-29 11:26:48,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +55: [2023-04-29 11:26:48,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +34: [2023-04-29 11:26:48,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +14: [2023-04-29 11:26:48,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +14: [2023-04-29 11:26:48,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +10: [2023-04-29 11:26:48,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +25: [2023-04-29 11:26:48,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +10: [2023-04-29 11:26:48,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +29: [2023-04-29 11:26:48,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +50: [2023-04-29 11:26:48,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +50: [2023-04-29 11:26:48,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +17: [2023-04-29 11:26:48,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +14: [2023-04-29 11:26:48,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +47: [2023-04-29 11:26:48,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +47: [2023-04-29 11:26:48,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +19: [2023-04-29 11:26:48,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +10: [2023-04-29 11:26:48,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +17: [2023-04-29 11:26:48,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +17: [2023-04-29 11:26:48,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +52: [2023-04-29 11:26:48,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +47: [2023-04-29 11:26:48,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +39: [2023-04-29 11:26:48,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +47: [2023-04-29 11:26:48,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +10: [2023-04-29 11:26:48,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +17: [2023-04-29 11:26:48,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +19: [2023-04-29 11:26:48,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +50: [2023-04-29 11:26:48,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +50: [2023-04-29 11:26:48,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +29: [2023-04-29 11:26:48,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +14: [2023-04-29 11:26:48,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +55: [2023-04-29 11:26:48,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +41: [2023-04-29 11:26:48,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +50: [2023-04-29 11:26:48,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +41: [2023-04-29 11:26:48,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +50: [2023-04-29 11:26:48,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +24: [2023-04-29 11:26:48,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +63: [2023-04-29 11:26:48,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +63: [2023-04-29 11:26:48,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +63: [2023-04-29 11:26:48,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +25: [2023-04-29 11:26:48,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +63: [2023-04-29 11:26:48,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +24: [2023-04-29 11:26:48,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +55: [2023-04-29 11:26:48,196] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +55: [2023-04-29 11:26:48,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +53: [2023-04-29 11:26:48,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +39: [2023-04-29 11:26:48,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 11:26:48,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 11:26:48,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 11:26:48,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +46: [2023-04-29 11:26:48,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +46: [2023-04-29 11:26:48,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +46: [2023-04-29 11:26:48,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +16: [2023-04-29 11:26:48,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +16: [2023-04-29 11:26:48,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +16: [2023-04-29 11:26:48,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +46: [2023-04-29 11:26:48,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +16: [2023-04-29 11:26:48,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +41: [2023-04-29 11:26:48,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +41: [2023-04-29 11:26:48,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +53: [2023-04-29 11:26:48,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +38: [2023-04-29 11:26:48,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +55: [2023-04-29 11:26:48,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +53: [2023-04-29 11:26:48,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +24: [2023-04-29 11:26:48,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +19: [2023-04-29 11:26:48,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +63: [2023-04-29 11:26:48,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +16: [2023-04-29 11:26:48,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +44: [2023-04-29 11:26:48,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +57: [2023-04-29 11:26:48,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +57: [2023-04-29 11:26:48,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +57: [2023-04-29 11:26:48,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +46: [2023-04-29 11:26:48,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +16: [2023-04-29 11:26:48,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +16: [2023-04-29 11:26:48,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +46: [2023-04-29 11:26:48,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +38: [2023-04-29 11:26:48,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +38: [2023-04-29 11:26:48,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +40: [2023-04-29 11:26:48,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +20: [2023-04-29 11:26:48,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +20: [2023-04-29 11:26:48,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +24: [2023-04-29 11:26:48,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +46: [2023-04-29 11:26:48,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +63: [2023-04-29 11:26:48,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 11:26:48,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 1: [2023-04-29 11:26:48,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +20: [2023-04-29 11:26:48,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +53: [2023-04-29 11:26:48,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +25: [2023-04-29 11:26:48,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +38: [2023-04-29 11:26:48,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +40: [2023-04-29 11:26:48,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +44: [2023-04-29 11:26:48,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +38: [2023-04-29 11:26:48,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +16: [2023-04-29 11:26:48,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +20: [2023-04-29 11:26:48,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +57: [2023-04-29 11:26:48,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. + 1: [2023-04-29 11:26:48,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +38: [2023-04-29 11:26:48,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +38: [2023-04-29 11:26:48,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +25: [2023-04-29 11:26:48,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 1: [2023-04-29 11:26:48,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +38: [2023-04-29 11:26:48,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +47: [2023-04-29 11:26:48,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +47: [2023-04-29 11:26:48,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +39: [2023-04-29 11:26:48,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 1: [2023-04-29 11:26:48,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +56: [2023-04-29 11:26:48,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +56: [2023-04-29 11:26:48,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +47: [2023-04-29 11:26:48,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 7: [2023-04-29 11:26:48,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 7: [2023-04-29 11:26:48,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 7: [2023-04-29 11:26:48,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 7: [2023-04-29 11:26:48,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +19: [2023-04-29 11:26:48,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +19: [2023-04-29 11:26:48,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +25: [2023-04-29 11:26:48,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +53: [2023-04-29 11:26:48,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +32: [2023-04-29 11:26:48,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +15: [2023-04-29 11:26:48,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +15: [2023-04-29 11:26:48,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +15: [2023-04-29 11:26:48,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 9: [2023-04-29 11:26:48,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +15: [2023-04-29 11:26:48,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +56: [2023-04-29 11:26:48,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +24: [2023-04-29 11:26:48,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +56: [2023-04-29 11:26:48,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +19: [2023-04-29 11:26:48,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +56: [2023-04-29 11:26:48,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +56: [2023-04-29 11:26:48,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +19: [2023-04-29 11:26:48,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +47: [2023-04-29 11:26:48,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +19: [2023-04-29 11:26:48,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +58: [2023-04-29 11:26:48,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +58: [2023-04-29 11:26:48,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +58: [2023-04-29 11:26:48,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +19: [2023-04-29 11:26:48,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +19: [2023-04-29 11:26:48,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +58: [2023-04-29 11:26:48,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +10: [2023-04-29 11:26:48,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +53: [2023-04-29 11:26:48,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +10: [2023-04-29 11:26:48,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +10: [2023-04-29 11:26:48,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +61: [2023-04-29 11:26:48,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +10: [2023-04-29 11:26:48,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +44: [2023-04-29 11:26:48,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +44: [2023-04-29 11:26:48,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +56: [2023-04-29 11:26:48,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +24: [2023-04-29 11:26:48,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +32: [2023-04-29 11:26:48,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +25: [2023-04-29 11:26:48,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +56: [2023-04-29 11:26:48,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +31: [2023-04-29 11:26:48,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +51: [2023-04-29 11:26:48,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +51: [2023-04-29 11:26:48,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +53: [2023-04-29 11:26:48,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +27: [2023-04-29 11:26:48,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +28: [2023-04-29 11:26:48,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +24: [2023-04-29 11:26:48,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +39: [2023-04-29 11:26:48,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +61: [2023-04-29 11:26:48,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +61: [2023-04-29 11:26:48,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +61: [2023-04-29 11:26:48,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +58: [2023-04-29 11:26:48,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +51: [2023-04-29 11:26:48,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +51: [2023-04-29 11:26:48,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +63: [2023-04-29 11:26:48,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +58: [2023-04-29 11:26:48,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +44: [2023-04-29 11:26:48,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +59: [2023-04-29 11:26:48,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +59: [2023-04-29 11:26:48,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +59: [2023-04-29 11:26:48,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +39: [2023-04-29 11:26:48,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +39: [2023-04-29 11:26:48,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +59: [2023-04-29 11:26:48,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +44: [2023-04-29 11:26:48,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +51: [2023-04-29 11:26:48,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +51: [2023-04-29 11:26:48,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +28: [2023-04-29 11:26:48,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +32: [2023-04-29 11:26:48,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +44: [2023-04-29 11:26:48,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +63: [2023-04-29 11:26:48,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +53: [2023-04-29 11:26:48,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +26: [2023-04-29 11:26:48,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +26: [2023-04-29 11:26:48,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +46: [2023-04-29 11:26:48,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +46: [2023-04-29 11:26:48,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +38: [2023-04-29 11:26:48,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 11:26:48,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +31: [2023-04-29 11:26:48,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +24: [2023-04-29 11:26:48,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +61: [2023-04-29 11:26:48,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +63: [2023-04-29 11:26:48,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +63: [2023-04-29 11:26:48,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +63: [2023-04-29 11:26:48,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +26: [2023-04-29 11:26:48,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +45: [2023-04-29 11:26:48,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +63: [2023-04-29 11:26:48,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +46: [2023-04-29 11:26:48,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +46: [2023-04-29 11:26:48,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +45: [2023-04-29 11:26:48,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +51: [2023-04-29 11:26:48,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +57: [2023-04-29 11:26:48,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +51: [2023-04-29 11:26:48,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +24: [2023-04-29 11:26:48,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +27: [2023-04-29 11:26:48,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +27: [2023-04-29 11:26:48,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +27: [2023-04-29 11:26:48,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +32: [2023-04-29 11:26:48,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +24: [2023-04-29 11:26:48,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +20: [2023-04-29 11:26:48,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +45: [2023-04-29 11:26:48,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +61: [2023-04-29 11:26:48,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... + 9: [2023-04-29 11:26:48,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +61: [2023-04-29 11:26:48,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +44: [2023-04-29 11:26:48,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +20: [2023-04-29 11:26:48,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +63: [2023-04-29 11:26:48,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +57: [2023-04-29 11:26:48,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +59: [2023-04-29 11:26:48,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +57: [2023-04-29 11:26:48,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +58: [2023-04-29 11:26:48,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +58: [2023-04-29 11:26:48,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +25: [2023-04-29 11:26:48,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +28: [2023-04-29 11:26:48,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +51: [2023-04-29 11:26:48,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +51: [2023-04-29 11:26:48,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +26: [2023-04-29 11:26:48,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 4: [2023-04-29 11:26:48,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 4: [2023-04-29 11:26:48,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +26: [2023-04-29 11:26:48,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +51: [2023-04-29 11:26:48,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +48: [2023-04-29 11:26:48,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +48: [2023-04-29 11:26:48,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 11:26:48,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +45: [2023-04-29 11:26:48,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +45: [2023-04-29 11:26:48,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +63: [2023-04-29 11:26:48,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +20: [2023-04-29 11:26:48,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +24: [2023-04-29 11:26:48,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +20: [2023-04-29 11:26:48,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +26: [2023-04-29 11:26:48,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +12: [2023-04-29 11:26:48,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +12: [2023-04-29 11:26:48,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +61: [2023-04-29 11:26:48,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... + 4: [2023-04-29 11:26:48,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +59: [2023-04-29 11:26:48,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +24: [2023-04-29 11:26:48,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +51: [2023-04-29 11:26:48,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +26: [2023-04-29 11:26:48,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 4: [2023-04-29 11:26:48,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +57: [2023-04-29 11:26:48,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +59: [2023-04-29 11:26:48,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +59: [2023-04-29 11:26:48,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 4: [2023-04-29 11:26:48,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +26: [2023-04-29 11:26:48,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +45: [2023-04-29 11:26:48,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +12: [2023-04-29 11:26:48,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +12: [2023-04-29 11:26:48,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 7: [2023-04-29 11:26:48,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +48: [2023-04-29 11:26:48,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +48: [2023-04-29 11:26:48,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 7: [2023-04-29 11:26:48,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +28: [2023-04-29 11:26:48,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +34: [2023-04-29 11:26:48,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +31: [2023-04-29 11:26:48,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +32: [2023-04-29 11:26:48,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +35: [2023-04-29 11:26:48,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +35: [2023-04-29 11:26:48,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +50: [2023-04-29 11:26:48,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +19: [2023-04-29 11:26:48,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +49: [2023-04-29 11:26:48,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +19: [2023-04-29 11:26:48,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +49: [2023-04-29 11:26:48,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +49: [2023-04-29 11:26:48,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +49: [2023-04-29 11:26:48,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +50: [2023-04-29 11:26:48,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 9: [2023-04-29 11:26:48,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 4: [2023-04-29 11:26:48,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 4: [2023-04-29 11:26:48,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +38: [2023-04-29 11:26:48,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +53: [2023-04-29 11:26:48,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +53: [2023-04-29 11:26:48,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 7: [2023-04-29 11:26:48,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +35: [2023-04-29 11:26:48,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +35: [2023-04-29 11:26:48,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +15: [2023-04-29 11:26:48,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 8: [2023-04-29 11:26:48,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +38: [2023-04-29 11:26:48,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 7: [2023-04-29 11:26:48,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +15: [2023-04-29 11:26:48,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +10: [2023-04-29 11:26:48,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +21: [2023-04-29 11:26:48,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 11:26:48,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 11:26:48,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +19: [2023-04-29 11:26:48,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +17: [2023-04-29 11:26:48,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +55: [2023-04-29 11:26:48,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +31: [2023-04-29 11:26:48,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +19: [2023-04-29 11:26:48,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +49: [2023-04-29 11:26:48,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +31: [2023-04-29 11:26:48,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +58: [2023-04-29 11:26:48,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +35: [2023-04-29 11:26:48,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +27: [2023-04-29 11:26:48,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +35: [2023-04-29 11:26:48,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 7: [2023-04-29 11:26:48,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +57: [2023-04-29 11:26:48,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +57: [2023-04-29 11:26:48,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +28: [2023-04-29 11:26:48,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +35: [2023-04-29 11:26:48,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +15: [2023-04-29 11:26:48,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +15: [2023-04-29 11:26:48,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +57: [2023-04-29 11:26:48,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +49: [2023-04-29 11:26:48,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +57: [2023-04-29 11:26:48,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +49: [2023-04-29 11:26:48,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +21: [2023-04-29 11:26:48,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +49: [2023-04-29 11:26:48,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +38: [2023-04-29 11:26:48,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +17: [2023-04-29 11:26:48,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +58: [2023-04-29 11:26:48,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +41: [2023-04-29 11:26:48,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +28: [2023-04-29 11:26:48,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +58: [2023-04-29 11:26:48,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +58: [2023-04-29 11:26:48,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +50: [2023-04-29 11:26:48,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +55: [2023-04-29 11:26:48,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +32: [2023-04-29 11:26:48,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +61: [2023-04-29 11:26:48,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +61: [2023-04-29 11:26:48,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +35: [2023-04-29 11:26:48,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +10: [2023-04-29 11:26:48,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +10: [2023-04-29 11:26:48,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +51: [2023-04-29 11:26:48,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +51: [2023-04-29 11:26:48,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +10: [2023-04-29 11:26:48,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +26: [2023-04-29 11:26:48,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +41: [2023-04-29 11:26:48,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +41: [2023-04-29 11:26:48,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +10: [2023-04-29 11:26:48,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 7: [2023-04-29 11:26:48,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +53: [2023-04-29 11:26:48,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 7: [2023-04-29 11:26:48,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +17: [2023-04-29 11:26:48,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +57: [2023-04-29 11:26:48,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +57: [2023-04-29 11:26:48,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +31: [2023-04-29 11:26:48,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +63: [2023-04-29 11:26:48,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +58: [2023-04-29 11:26:48,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +58: [2023-04-29 11:26:48,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +38: [2023-04-29 11:26:48,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +53: [2023-04-29 11:26:48,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +51: [2023-04-29 11:26:48,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +57: [2023-04-29 11:26:48,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +32: [2023-04-29 11:26:48,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +32: [2023-04-29 11:26:48,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +32: [2023-04-29 11:26:48,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +32: [2023-04-29 11:26:48,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +10: [2023-04-29 11:26:48,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +63: [2023-04-29 11:26:48,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +57: [2023-04-29 11:26:48,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +34: [2023-04-29 11:26:48,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +51: [2023-04-29 11:26:48,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +26: [2023-04-29 11:26:48,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +55: [2023-04-29 11:26:48,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 11:26:48,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +27: [2023-04-29 11:26:48,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +61: [2023-04-29 11:26:48,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +26: [2023-04-29 11:26:48,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +27: [2023-04-29 11:26:48,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +46: [2023-04-29 11:26:48,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 7: [2023-04-29 11:26:48,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +34: [2023-04-29 11:26:48,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +46: [2023-04-29 11:26:48,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +27: [2023-04-29 11:26:48,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +41: [2023-04-29 11:26:48,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +48: [2023-04-29 11:26:48,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +28: [2023-04-29 11:26:48,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +43: [2023-04-29 11:26:48,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +43: [2023-04-29 11:26:48,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +43: [2023-04-29 11:26:48,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +43: [2023-04-29 11:26:48,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +17: [2023-04-29 11:26:48,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +55: [2023-04-29 11:26:48,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 11:26:48,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +12: [2023-04-29 11:26:48,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +26: [2023-04-29 11:26:48,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 4: [2023-04-29 11:26:48,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 7: [2023-04-29 11:26:48,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +48: [2023-04-29 11:26:48,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +43: [2023-04-29 11:26:48,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 4: [2023-04-29 11:26:48,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +43: [2023-04-29 11:26:48,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +43: [2023-04-29 11:26:48,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +23: [2023-04-29 11:26:48,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +23: [2023-04-29 11:26:48,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +61: [2023-04-29 11:26:48,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +23: [2023-04-29 11:26:48,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +50: [2023-04-29 11:26:48,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +23: [2023-04-29 11:26:48,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +43: [2023-04-29 11:26:48,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +41: [2023-04-29 11:26:48,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +36: [2023-04-29 11:26:48,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +36: [2023-04-29 11:26:48,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +36: [2023-04-29 11:26:48,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +36: [2023-04-29 11:26:48,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +36: [2023-04-29 11:26:48,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +36: [2023-04-29 11:26:48,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +36: [2023-04-29 11:26:48,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +58: [2023-04-29 11:26:48,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +36: [2023-04-29 11:26:48,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +58: [2023-04-29 11:26:48,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +12: [2023-04-29 11:26:48,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +26: [2023-04-29 11:26:48,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +12: [2023-04-29 11:26:48,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +12: [2023-04-29 11:26:48,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +34: [2023-04-29 11:26:48,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +34: [2023-04-29 11:26:48,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +26: [2023-04-29 11:26:48,271] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +30: [2023-04-29 11:26:48,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +30: [2023-04-29 11:26:48,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +30: [2023-04-29 11:26:48,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +13: [2023-04-29 11:26:48,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +13: [2023-04-29 11:26:48,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +13: [2023-04-29 11:26:48,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +48: [2023-04-29 11:26:48,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +13: [2023-04-29 11:26:48,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +17: [2023-04-29 11:26:48,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +28: [2023-04-29 11:26:48,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +16: [2023-04-29 11:26:48,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +16: [2023-04-29 11:26:48,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +48: [2023-04-29 11:26:48,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +26: [2023-04-29 11:26:48,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +55: [2023-04-29 11:26:48,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +30: [2023-04-29 11:26:48,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +31: [2023-04-29 11:26:48,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 4: [2023-04-29 11:26:48,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +36: [2023-04-29 11:26:48,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +36: [2023-04-29 11:26:48,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +44: [2023-04-29 11:26:48,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 8: [2023-04-29 11:26:48,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 9: [2023-04-29 11:26:48,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +53: [2023-04-29 11:26:48,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +44: [2023-04-29 11:26:48,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +44: [2023-04-29 11:26:48,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +44: [2023-04-29 11:26:48,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +41: [2023-04-29 11:26:48,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +36: [2023-04-29 11:26:48,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +36: [2023-04-29 11:26:48,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +41: [2023-04-29 11:26:48,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +26: [2023-04-29 11:26:48,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 8: [2023-04-29 11:26:48,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 9: [2023-04-29 11:26:48,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +36: [2023-04-29 11:26:48,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +53: [2023-04-29 11:26:48,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +36: [2023-04-29 11:26:48,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +36: [2023-04-29 11:26:48,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +31: [2023-04-29 11:26:48,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +50: [2023-04-29 11:26:48,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +36: [2023-04-29 11:26:48,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +38: [2023-04-29 11:26:48,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +16: [2023-04-29 11:26:48,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +30: [2023-04-29 11:26:48,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +38: [2023-04-29 11:26:48,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +30: [2023-04-29 11:26:48,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +43: [2023-04-29 11:26:48,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +43: [2023-04-29 11:26:48,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +43: [2023-04-29 11:26:48,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +60: [2023-04-29 11:26:48,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +60: [2023-04-29 11:26:48,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +43: [2023-04-29 11:26:48,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +30: [2023-04-29 11:26:48,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +13: [2023-04-29 11:26:48,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +44: [2023-04-29 11:26:48,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +30: [2023-04-29 11:26:48,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +13: [2023-04-29 11:26:48,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +13: [2023-04-29 11:26:48,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +44: [2023-04-29 11:26:48,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +13: [2023-04-29 11:26:48,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +60: [2023-04-29 11:26:48,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +10: [2023-04-29 11:26:48,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +60: [2023-04-29 11:26:48,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +44: [2023-04-29 11:26:48,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +17: [2023-04-29 11:26:48,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +21: [2023-04-29 11:26:48,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +56: [2023-04-29 11:26:48,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +56: [2023-04-29 11:26:48,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +21: [2023-04-29 11:26:48,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +21: [2023-04-29 11:26:48,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +41: [2023-04-29 11:26:48,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... + 8: [2023-04-29 11:26:48,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +46: [2023-04-29 11:26:48,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 6: [2023-04-29 11:26:48,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 6: [2023-04-29 11:26:48,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 6: [2023-04-29 11:26:48,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 6: [2023-04-29 11:26:48,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +55: [2023-04-29 11:26:48,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +21: [2023-04-29 11:26:48,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +44: [2023-04-29 11:26:48,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +50: [2023-04-29 11:26:48,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 8: [2023-04-29 11:26:48,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +61: [2023-04-29 11:26:48,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +10: [2023-04-29 11:26:48,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +60: [2023-04-29 11:26:48,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +16: [2023-04-29 11:26:48,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +56: [2023-04-29 11:26:48,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +56: [2023-04-29 11:26:48,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +46: [2023-04-29 11:26:48,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +60: [2023-04-29 11:26:48,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +37: [2023-04-29 11:26:48,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +37: [2023-04-29 11:26:48,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +37: [2023-04-29 11:26:48,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +37: [2023-04-29 11:26:48,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +37: [2023-04-29 11:26:48,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +61: [2023-04-29 11:26:48,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +37: [2023-04-29 11:26:48,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +37: [2023-04-29 11:26:48,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +37: [2023-04-29 11:26:48,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +60: [2023-04-29 11:26:48,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +42: [2023-04-29 11:26:48,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +42: [2023-04-29 11:26:48,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +17: [2023-04-29 11:26:48,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +42: [2023-04-29 11:26:48,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 6: [2023-04-29 11:26:48,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 6: [2023-04-29 11:26:48,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +10: [2023-04-29 11:26:48,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +42: [2023-04-29 11:26:48,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +14: [2023-04-29 11:26:48,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 6: [2023-04-29 11:26:48,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +14: [2023-04-29 11:26:48,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 6: [2023-04-29 11:26:48,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +16: [2023-04-29 11:26:48,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +16: [2023-04-29 11:26:48,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +10: [2023-04-29 11:26:48,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 7: [2023-04-29 11:26:48,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +60: [2023-04-29 11:26:48,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +53: [2023-04-29 11:26:48,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +53: [2023-04-29 11:26:48,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +50: [2023-04-29 11:26:48,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +61: [2023-04-29 11:26:48,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +55: [2023-04-29 11:26:48,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +38: [2023-04-29 11:26:48,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +42: [2023-04-29 11:26:48,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 11:26:48,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 11:26:48,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +34: [2023-04-29 11:26:48,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +37: [2023-04-29 11:26:48,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +17: [2023-04-29 11:26:48,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +42: [2023-04-29 11:26:48,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +14: [2023-04-29 11:26:48,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +14: [2023-04-29 11:26:48,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +14: [2023-04-29 11:26:48,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +55: [2023-04-29 11:26:48,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +14: [2023-04-29 11:26:48,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +14: [2023-04-29 11:26:48,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +14: [2023-04-29 11:26:48,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +42: [2023-04-29 11:26:48,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +14: [2023-04-29 11:26:48,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +59: [2023-04-29 11:26:48,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +16: [2023-04-29 11:26:48,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +34: [2023-04-29 11:26:48,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +23: [2023-04-29 11:26:48,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +42: [2023-04-29 11:26:48,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +37: [2023-04-29 11:26:48,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +29: [2023-04-29 11:26:48,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +46: [2023-04-29 11:26:48,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +46: [2023-04-29 11:26:48,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +14: [2023-04-29 11:26:48,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +29: [2023-04-29 11:26:48,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +29: [2023-04-29 11:26:48,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +23: [2023-04-29 11:26:48,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +37: [2023-04-29 11:26:48,297] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +29: [2023-04-29 11:26:48,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +18: [2023-04-29 11:26:48,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +18: [2023-04-29 11:26:48,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +19: [2023-04-29 11:26:48,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +16: [2023-04-29 11:26:48,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +18: [2023-04-29 11:26:48,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +61: [2023-04-29 11:26:48,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +37: [2023-04-29 11:26:48,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +37: [2023-04-29 11:26:48,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +57: [2023-04-29 11:26:48,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +37: [2023-04-29 11:26:48,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 0: [2023-04-29 11:26:48,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 0: [2023-04-29 11:26:48,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +23: [2023-04-29 11:26:48,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +14: [2023-04-29 11:26:48,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... + 0: [2023-04-29 11:26:48,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 7: [2023-04-29 11:26:48,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 8: [2023-04-29 11:26:48,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +16: [2023-04-29 11:26:48,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +23: [2023-04-29 11:26:48,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 7: [2023-04-29 11:26:48,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +32: [2023-04-29 11:26:48,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +50: [2023-04-29 11:26:48,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +32: [2023-04-29 11:26:48,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +19: [2023-04-29 11:26:48,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +19: [2023-04-29 11:26:48,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +14: [2023-04-29 11:26:48,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +32: [2023-04-29 11:26:48,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +32: [2023-04-29 11:26:48,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +14: [2023-04-29 11:26:48,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +14: [2023-04-29 11:26:48,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +14: [2023-04-29 11:26:48,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +16: [2023-04-29 11:26:48,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +57: [2023-04-29 11:26:48,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +63: [2023-04-29 11:26:48,303] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +18: [2023-04-29 11:26:48,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +14: [2023-04-29 11:26:48,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +34: [2023-04-29 11:26:48,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +19: [2023-04-29 11:26:48,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +49: [2023-04-29 11:26:48,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +63: [2023-04-29 11:26:48,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +51: [2023-04-29 11:26:48,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +16: [2023-04-29 11:26:48,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +57: [2023-04-29 11:26:48,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +43: [2023-04-29 11:26:48,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +43: [2023-04-29 11:26:48,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +43: [2023-04-29 11:26:48,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +43: [2023-04-29 11:26:48,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +59: [2023-04-29 11:26:48,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +56: [2023-04-29 11:26:48,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +54: [2023-04-29 11:26:48,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +54: [2023-04-29 11:26:48,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +56: [2023-04-29 11:26:48,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 8: [2023-04-29 11:26:48,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +63: [2023-04-29 11:26:48,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +63: [2023-04-29 11:26:48,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +56: [2023-04-29 11:26:48,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +46: [2023-04-29 11:26:48,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +51: [2023-04-29 11:26:48,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +51: [2023-04-29 11:26:48,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +63: [2023-04-29 11:26:48,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +22: [2023-04-29 11:26:48,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +41: [2023-04-29 11:26:48,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +22: [2023-04-29 11:26:48,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +22: [2023-04-29 11:26:48,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +41: [2023-04-29 11:26:48,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +41: [2023-04-29 11:26:48,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +41: [2023-04-29 11:26:48,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +22: [2023-04-29 11:26:48,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +54: [2023-04-29 11:26:48,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +54: [2023-04-29 11:26:48,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +15: [2023-04-29 11:26:48,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +63: [2023-04-29 11:26:48,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +30: [2023-04-29 11:26:48,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +30: [2023-04-29 11:26:48,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +57: [2023-04-29 11:26:48,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +30: [2023-04-29 11:26:48,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +30: [2023-04-29 11:26:48,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +17: [2023-04-29 11:26:48,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +17: [2023-04-29 11:26:48,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +17: [2023-04-29 11:26:48,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +56: [2023-04-29 11:26:48,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 6: [2023-04-29 11:26:48,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 6: [2023-04-29 11:26:48,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 6: [2023-04-29 11:26:48,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +17: [2023-04-29 11:26:48,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +46: [2023-04-29 11:26:48,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 6: [2023-04-29 11:26:48,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +22: [2023-04-29 11:26:48,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +63: [2023-04-29 11:26:48,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... + 7: [2023-04-29 11:26:48,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +59: [2023-04-29 11:26:48,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +57: [2023-04-29 11:26:48,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +54: [2023-04-29 11:26:48,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +54: [2023-04-29 11:26:48,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +41: [2023-04-29 11:26:48,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +41: [2023-04-29 11:26:48,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +10: [2023-04-29 11:26:48,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +63: [2023-04-29 11:26:48,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +54: [2023-04-29 11:26:48,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +41: [2023-04-29 11:26:48,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +54: [2023-04-29 11:26:48,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +51: [2023-04-29 11:26:48,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +41: [2023-04-29 11:26:48,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +57: [2023-04-29 11:26:48,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +22: [2023-04-29 11:26:48,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +35: [2023-04-29 11:26:48,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 3: [2023-04-29 11:26:48,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +19: [2023-04-29 11:26:48,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +19: [2023-04-29 11:26:48,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 3: [2023-04-29 11:26:48,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +22: [2023-04-29 11:26:48,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +57: [2023-04-29 11:26:48,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +15: [2023-04-29 11:26:48,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +49: [2023-04-29 11:26:48,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +49: [2023-04-29 11:26:48,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +49: [2023-04-29 11:26:48,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +28: [2023-04-29 11:26:48,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +28: [2023-04-29 11:26:48,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +35: [2023-04-29 11:26:48,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +58: [2023-04-29 11:26:48,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +35: [2023-04-29 11:26:48,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +35: [2023-04-29 11:26:48,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +28: [2023-04-29 11:26:48,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +28: [2023-04-29 11:26:48,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 7: [2023-04-29 11:26:48,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +52: [2023-04-29 11:26:48,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +52: [2023-04-29 11:26:48,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +39: [2023-04-29 11:26:48,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +35: [2023-04-29 11:26:48,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +39: [2023-04-29 11:26:48,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +39: [2023-04-29 11:26:48,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +39: [2023-04-29 11:26:48,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +59: [2023-04-29 11:26:48,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +59: [2023-04-29 11:26:48,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +57: [2023-04-29 11:26:48,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +35: [2023-04-29 11:26:48,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +35: [2023-04-29 11:26:48,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +22: [2023-04-29 11:26:48,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +16: [2023-04-29 11:26:48,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +16: [2023-04-29 11:26:48,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +16: [2023-04-29 11:26:48,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +19: [2023-04-29 11:26:48,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +57: [2023-04-29 11:26:48,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +18: [2023-04-29 11:26:48,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +19: [2023-04-29 11:26:48,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +10: [2023-04-29 11:26:48,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +29: [2023-04-29 11:26:48,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +45: [2023-04-29 11:26:48,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +45: [2023-04-29 11:26:48,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +58: [2023-04-29 11:26:48,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +35: [2023-04-29 11:26:48,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 11:26:48,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 7: [2023-04-29 11:26:48,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 0: [2023-04-29 11:26:48,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +10: [2023-04-29 11:26:48,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +16: [2023-04-29 11:26:48,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +15: [2023-04-29 11:26:48,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +43: [2023-04-29 11:26:48,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +43: [2023-04-29 11:26:48,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +47: [2023-04-29 11:26:48,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +49: [2023-04-29 11:26:48,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +47: [2023-04-29 11:26:48,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +52: [2023-04-29 11:26:48,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +12: [2023-04-29 11:26:48,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +58: [2023-04-29 11:26:48,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +58: [2023-04-29 11:26:48,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +15: [2023-04-29 11:26:48,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +15: [2023-04-29 11:26:48,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +45: [2023-04-29 11:26:48,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +54: [2023-04-29 11:26:48,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +54: [2023-04-29 11:26:48,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +46: [2023-04-29 11:26:48,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +52: [2023-04-29 11:26:48,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +52: [2023-04-29 11:26:48,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 11:26:48,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +52: [2023-04-29 11:26:48,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +46: [2023-04-29 11:26:48,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +29: [2023-04-29 11:26:48,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +29: [2023-04-29 11:26:48,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +51: [2023-04-29 11:26:48,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +10: [2023-04-29 11:26:48,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... + 7: [2023-04-29 11:26:48,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +45: [2023-04-29 11:26:48,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +26: [2023-04-29 11:26:48,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 7: [2023-04-29 11:26:48,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +57: [2023-04-29 11:26:48,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +57: [2023-04-29 11:26:48,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +18: [2023-04-29 11:26:48,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 4: [2023-04-29 11:26:48,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +47: [2023-04-29 11:26:48,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +47: [2023-04-29 11:26:48,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +47: [2023-04-29 11:26:48,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +47: [2023-04-29 11:26:48,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +47: [2023-04-29 11:26:48,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 11:26:48,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +47: [2023-04-29 11:26:48,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +12: [2023-04-29 11:26:48,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +54: [2023-04-29 11:26:48,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +54: [2023-04-29 11:26:48,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +16: [2023-04-29 11:26:48,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +18: [2023-04-29 11:26:48,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +29: [2023-04-29 11:26:48,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +15: [2023-04-29 11:26:48,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +26: [2023-04-29 11:26:48,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +43: [2023-04-29 11:26:48,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +51: [2023-04-29 11:26:48,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +15: [2023-04-29 11:26:48,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +58: [2023-04-29 11:26:48,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +57: [2023-04-29 11:26:48,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +58: [2023-04-29 11:26:48,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +15: [2023-04-29 11:26:48,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +52: [2023-04-29 11:26:48,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +52: [2023-04-29 11:26:48,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +45: [2023-04-29 11:26:48,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +58: [2023-04-29 11:26:48,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 7: [2023-04-29 11:26:48,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +51: [2023-04-29 11:26:48,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +26: [2023-04-29 11:26:48,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +47: [2023-04-29 11:26:48,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +47: [2023-04-29 11:26:48,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +51: [2023-04-29 11:26:48,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +26: [2023-04-29 11:26:48,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +47: [2023-04-29 11:26:48,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +18: [2023-04-29 11:26:48,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +51: [2023-04-29 11:26:48,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +47: [2023-04-29 11:26:48,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +47: [2023-04-29 11:26:48,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +47: [2023-04-29 11:26:48,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +51: [2023-04-29 11:26:48,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +46: [2023-04-29 11:26:48,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +51: [2023-04-29 11:26:48,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +26: [2023-04-29 11:26:48,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +51: [2023-04-29 11:26:48,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +12: [2023-04-29 11:26:48,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +47: [2023-04-29 11:26:48,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +47: [2023-04-29 11:26:48,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +17: [2023-04-29 11:26:48,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +12: [2023-04-29 11:26:48,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +17: [2023-04-29 11:26:48,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +51: [2023-04-29 11:26:48,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... + 4: [2023-04-29 11:26:48,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +46: [2023-04-29 11:26:48,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +58: [2023-04-29 11:26:48,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +44: [2023-04-29 11:26:48,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +26: [2023-04-29 11:26:48,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +51: [2023-04-29 11:26:48,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +59: [2023-04-29 11:26:48,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +36: [2023-04-29 11:26:48,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +30: [2023-04-29 11:26:48,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +30: [2023-04-29 11:26:48,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 3: [2023-04-29 11:26:48,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +17: [2023-04-29 11:26:48,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +17: [2023-04-29 11:26:48,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +30: [2023-04-29 11:26:48,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 6: [2023-04-29 11:26:48,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +46: [2023-04-29 11:26:48,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +12: [2023-04-29 11:26:48,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +51: [2023-04-29 11:26:48,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +30: [2023-04-29 11:26:48,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +10: [2023-04-29 11:26:48,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +46: [2023-04-29 11:26:48,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +12: [2023-04-29 11:26:48,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +12: [2023-04-29 11:26:48,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... + 9: [2023-04-29 11:26:48,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +51: [2023-04-29 11:26:48,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +44: [2023-04-29 11:26:48,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +44: [2023-04-29 11:26:48,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 6: [2023-04-29 11:26:48,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 6: [2023-04-29 11:26:48,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 4: [2023-04-29 11:26:48,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +62: [2023-04-29 11:26:48,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +62: [2023-04-29 11:26:48,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +62: [2023-04-29 11:26:48,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +13: [2023-04-29 11:26:48,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +43: [2023-04-29 11:26:48,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +62: [2023-04-29 11:26:48,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. + 6: [2023-04-29 11:26:48,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +36: [2023-04-29 11:26:48,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +36: [2023-04-29 11:26:48,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +36: [2023-04-29 11:26:48,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +28: [2023-04-29 11:26:48,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +28: [2023-04-29 11:26:48,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +60: [2023-04-29 11:26:48,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +49: [2023-04-29 11:26:48,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +46: [2023-04-29 11:26:48,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +46: [2023-04-29 11:26:48,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +26: [2023-04-29 11:26:48,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +59: [2023-04-29 11:26:48,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +60: [2023-04-29 11:26:48,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +60: [2023-04-29 11:26:48,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +28: [2023-04-29 11:26:48,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 0: [2023-04-29 11:26:48,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +13: [2023-04-29 11:26:48,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +13: [2023-04-29 11:26:48,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +13: [2023-04-29 11:26:48,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +10: [2023-04-29 11:26:48,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +10: [2023-04-29 11:26:48,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +12: [2023-04-29 11:26:48,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +60: [2023-04-29 11:26:48,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +28: [2023-04-29 11:26:48,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +60: [2023-04-29 11:26:48,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +35: [2023-04-29 11:26:48,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +42: [2023-04-29 11:26:48,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 3: [2023-04-29 11:26:48,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 7: [2023-04-29 11:26:48,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +49: [2023-04-29 11:26:48,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +10: [2023-04-29 11:26:48,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +14: [2023-04-29 11:26:48,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 0: [2023-04-29 11:26:48,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +35: [2023-04-29 11:26:48,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... + 9: [2023-04-29 11:26:48,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +57: [2023-04-29 11:26:48,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +35: [2023-04-29 11:26:48,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +35: [2023-04-29 11:26:48,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +30: [2023-04-29 11:26:48,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +39: [2023-04-29 11:26:48,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +35: [2023-04-29 11:26:48,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +43: [2023-04-29 11:26:48,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +43: [2023-04-29 11:26:48,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +49: [2023-04-29 11:26:48,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +39: [2023-04-29 11:26:48,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +39: [2023-04-29 11:26:48,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +39: [2023-04-29 11:26:48,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +59: [2023-04-29 11:26:48,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +46: [2023-04-29 11:26:48,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... + 2: [2023-04-29 11:26:48,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 2: [2023-04-29 11:26:48,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 2: [2023-04-29 11:26:48,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +54: [2023-04-29 11:26:48,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +26: [2023-04-29 11:26:48,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... + 2: [2023-04-29 11:26:48,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +46: [2023-04-29 11:26:48,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +37: [2023-04-29 11:26:48,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +10: [2023-04-29 11:26:48,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +10: [2023-04-29 11:26:48,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... + 4: [2023-04-29 11:26:48,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +54: [2023-04-29 11:26:48,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +54: [2023-04-29 11:26:48,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +37: [2023-04-29 11:26:48,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 7: [2023-04-29 11:26:48,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +44: [2023-04-29 11:26:48,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 0: [2023-04-29 11:26:48,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +42: [2023-04-29 11:26:48,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +35: [2023-04-29 11:26:48,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 4: [2023-04-29 11:26:48,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +30: [2023-04-29 11:26:48,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +30: [2023-04-29 11:26:48,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +30: [2023-04-29 11:26:48,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +35: [2023-04-29 11:26:48,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +35: [2023-04-29 11:26:48,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 4: [2023-04-29 11:26:48,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... + 0: [2023-04-29 11:26:48,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +60: [2023-04-29 11:26:48,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +54: [2023-04-29 11:26:48,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 5: [2023-04-29 11:26:48,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +60: [2023-04-29 11:26:48,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +57: [2023-04-29 11:26:48,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +57: [2023-04-29 11:26:48,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +42: [2023-04-29 11:26:48,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +42: [2023-04-29 11:26:48,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +57: [2023-04-29 11:26:48,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 8: [2023-04-29 11:26:48,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +23: [2023-04-29 11:26:48,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +23: [2023-04-29 11:26:48,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +43: [2023-04-29 11:26:48,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +14: [2023-04-29 11:26:48,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +60: [2023-04-29 11:26:48,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +36: [2023-04-29 11:26:48,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 5: [2023-04-29 11:26:48,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +15: [2023-04-29 11:26:48,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +15: [2023-04-29 11:26:48,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +15: [2023-04-29 11:26:48,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +15: [2023-04-29 11:26:48,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +23: [2023-04-29 11:26:48,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +23: [2023-04-29 11:26:48,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +37: [2023-04-29 11:26:48,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 5: [2023-04-29 11:26:48,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 4: [2023-04-29 11:26:48,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +44: [2023-04-29 11:26:48,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +14: [2023-04-29 11:26:48,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +23: [2023-04-29 11:26:48,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +23: [2023-04-29 11:26:48,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +33: [2023-04-29 11:26:48,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +33: [2023-04-29 11:26:48,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +37: [2023-04-29 11:26:48,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +33: [2023-04-29 11:26:48,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. + 6: [2023-04-29 11:26:48,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +44: [2023-04-29 11:26:48,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +33: [2023-04-29 11:26:48,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +15: [2023-04-29 11:26:48,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +15: [2023-04-29 11:26:48,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 1: [2023-04-29 11:26:48,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +23: [2023-04-29 11:26:48,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +23: [2023-04-29 11:26:48,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +15: [2023-04-29 11:26:48,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +62: [2023-04-29 11:26:48,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 6: [2023-04-29 11:26:48,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 6: [2023-04-29 11:26:48,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +15: [2023-04-29 11:26:48,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +13: [2023-04-29 11:26:48,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +43: [2023-04-29 11:26:48,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 8: [2023-04-29 11:26:48,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +36: [2023-04-29 11:26:48,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +44: [2023-04-29 11:26:48,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +62: [2023-04-29 11:26:48,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 6: [2023-04-29 11:26:48,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +13: [2023-04-29 11:26:48,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +62: [2023-04-29 11:26:48,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +22: [2023-04-29 11:26:48,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +36: [2023-04-29 11:26:48,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +36: [2023-04-29 11:26:48,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +13: [2023-04-29 11:26:48,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +13: [2023-04-29 11:26:48,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +62: [2023-04-29 11:26:48,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +41: [2023-04-29 11:26:48,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 1: [2023-04-29 11:26:48,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +60: [2023-04-29 11:26:48,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +42: [2023-04-29 11:26:48,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 1: [2023-04-29 11:26:48,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 1: [2023-04-29 11:26:48,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +16: [2023-04-29 11:26:48,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +18: [2023-04-29 11:26:48,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +14: [2023-04-29 11:26:48,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +60: [2023-04-29 11:26:48,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +30: [2023-04-29 11:26:48,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 8: [2023-04-29 11:26:48,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +60: [2023-04-29 11:26:48,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +60: [2023-04-29 11:26:48,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +31: [2023-04-29 11:26:48,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +31: [2023-04-29 11:26:48,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 8: [2023-04-29 11:26:48,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +52: [2023-04-29 11:26:48,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 11:26:48,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +14: [2023-04-29 11:26:48,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +18: [2023-04-29 11:26:48,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +41: [2023-04-29 11:26:48,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +37: [2023-04-29 11:26:48,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +37: [2023-04-29 11:26:48,387] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +52: [2023-04-29 11:26:48,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +52: [2023-04-29 11:26:48,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +16: [2023-04-29 11:26:48,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +41: [2023-04-29 11:26:48,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +41: [2023-04-29 11:26:48,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +31: [2023-04-29 11:26:48,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +60: [2023-04-29 11:26:48,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +31: [2023-04-29 11:26:48,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +22: [2023-04-29 11:26:48,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +43: [2023-04-29 11:26:48,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +43: [2023-04-29 11:26:48,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +22: [2023-04-29 11:26:48,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +49: [2023-04-29 11:26:48,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +49: [2023-04-29 11:26:48,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +29: [2023-04-29 11:26:48,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +49: [2023-04-29 11:26:48,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +49: [2023-04-29 11:26:48,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +43: [2023-04-29 11:26:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +43: [2023-04-29 11:26:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +22: [2023-04-29 11:26:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +44: [2023-04-29 11:26:48,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +54: [2023-04-29 11:26:48,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +42: [2023-04-29 11:26:48,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 2: [2023-04-29 11:26:48,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 2: [2023-04-29 11:26:48,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 8: [2023-04-29 11:26:48,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... + 8: [2023-04-29 11:26:48,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +54: [2023-04-29 11:26:48,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +52: [2023-04-29 11:26:48,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +29: [2023-04-29 11:26:48,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +29: [2023-04-29 11:26:48,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +52: [2023-04-29 11:26:48,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +11: [2023-04-29 11:26:48,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +11: [2023-04-29 11:26:48,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +11: [2023-04-29 11:26:48,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +21: [2023-04-29 11:26:48,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +21: [2023-04-29 11:26:48,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +30: [2023-04-29 11:26:48,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +30: [2023-04-29 11:26:48,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +30: [2023-04-29 11:26:48,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +27: [2023-04-29 11:26:48,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +27: [2023-04-29 11:26:48,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +27: [2023-04-29 11:26:48,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +11: [2023-04-29 11:26:48,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +27: [2023-04-29 11:26:48,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +43: [2023-04-29 11:26:48,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +43: [2023-04-29 11:26:48,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... + 2: [2023-04-29 11:26:48,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 2: [2023-04-29 11:26:48,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +21: [2023-04-29 11:26:48,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +21: [2023-04-29 11:26:48,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +43: [2023-04-29 11:26:48,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +16: [2023-04-29 11:26:48,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +16: [2023-04-29 11:26:48,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +14: [2023-04-29 11:26:48,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +43: [2023-04-29 11:26:48,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +42: [2023-04-29 11:26:48,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +37: [2023-04-29 11:26:48,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +42: [2023-04-29 11:26:48,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +18: [2023-04-29 11:26:48,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +13: [2023-04-29 11:26:48,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +47: [2023-04-29 11:26:48,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +60: [2023-04-29 11:26:48,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +13: [2023-04-29 11:26:48,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +13: [2023-04-29 11:26:48,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +13: [2023-04-29 11:26:48,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +29: [2023-04-29 11:26:48,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +45: [2023-04-29 11:26:48,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +37: [2023-04-29 11:26:48,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +33: [2023-04-29 11:26:48,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +14: [2023-04-29 11:26:48,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +22: [2023-04-29 11:26:48,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +22: [2023-04-29 11:26:48,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +62: [2023-04-29 11:26:48,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +62: [2023-04-29 11:26:48,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +62: [2023-04-29 11:26:48,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +62: [2023-04-29 11:26:48,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +22: [2023-04-29 11:26:48,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +17: [2023-04-29 11:26:48,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +52: [2023-04-29 11:26:48,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +17: [2023-04-29 11:26:48,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +18: [2023-04-29 11:26:48,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +18: [2023-04-29 11:26:48,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 6: [2023-04-29 11:26:48,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +29: [2023-04-29 11:26:48,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +16: [2023-04-29 11:26:48,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +16: [2023-04-29 11:26:48,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +16: [2023-04-29 11:26:48,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +60: [2023-04-29 11:26:48,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +60: [2023-04-29 11:26:48,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +55: [2023-04-29 11:26:48,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. + 3: [2023-04-29 11:26:48,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +54: [2023-04-29 11:26:48,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +22: [2023-04-29 11:26:48,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +55: [2023-04-29 11:26:48,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +55: [2023-04-29 11:26:48,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +29: [2023-04-29 11:26:48,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +55: [2023-04-29 11:26:48,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +62: [2023-04-29 11:26:48,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +22: [2023-04-29 11:26:48,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +54: [2023-04-29 11:26:48,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +62: [2023-04-29 11:26:48,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +17: [2023-04-29 11:26:48,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +18: [2023-04-29 11:26:48,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +17: [2023-04-29 11:26:48,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... + 6: [2023-04-29 11:26:48,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 6: [2023-04-29 11:26:48,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +33: [2023-04-29 11:26:48,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +33: [2023-04-29 11:26:48,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +32: [2023-04-29 11:26:48,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +32: [2023-04-29 11:26:48,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +62: [2023-04-29 11:26:48,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +62: [2023-04-29 11:26:48,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +25: [2023-04-29 11:26:48,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +25: [2023-04-29 11:26:48,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +25: [2023-04-29 11:26:48,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +25: [2023-04-29 11:26:48,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +47: [2023-04-29 11:26:48,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 11:26:48,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +32: [2023-04-29 11:26:48,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. + 3: [2023-04-29 11:26:48,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +47: [2023-04-29 11:26:48,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +17: [2023-04-29 11:26:48,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +17: [2023-04-29 11:26:48,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 5: [2023-04-29 11:26:48,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +33: [2023-04-29 11:26:48,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +52: [2023-04-29 11:26:48,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 11:26:48,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. + 6: [2023-04-29 11:26:48,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +18: [2023-04-29 11:26:48,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +29: [2023-04-29 11:26:48,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +41: [2023-04-29 11:26:48,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +16: [2023-04-29 11:26:48,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +32: [2023-04-29 11:26:48,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +12: [2023-04-29 11:26:48,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +12: [2023-04-29 11:26:48,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +12: [2023-04-29 11:26:48,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +47: [2023-04-29 11:26:48,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +18: [2023-04-29 11:26:48,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +29: [2023-04-29 11:26:48,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +45: [2023-04-29 11:26:48,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +17: [2023-04-29 11:26:48,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +17: [2023-04-29 11:26:48,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +54: [2023-04-29 11:26:48,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +28: [2023-04-29 11:26:48,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +30: [2023-04-29 11:26:48,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +30: [2023-04-29 11:26:48,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +35: [2023-04-29 11:26:48,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +28: [2023-04-29 11:26:48,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +28: [2023-04-29 11:26:48,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +14: [2023-04-29 11:26:48,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +31: [2023-04-29 11:26:48,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +11: [2023-04-29 11:26:48,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +52: [2023-04-29 11:26:48,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +30: [2023-04-29 11:26:48,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +52: [2023-04-29 11:26:48,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +52: [2023-04-29 11:26:48,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +31: [2023-04-29 11:26:48,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +31: [2023-04-29 11:26:48,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +50: [2023-04-29 11:26:48,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +50: [2023-04-29 11:26:48,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +50: [2023-04-29 11:26:48,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +50: [2023-04-29 11:26:48,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +41: [2023-04-29 11:26:48,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +27: [2023-04-29 11:26:48,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +49: [2023-04-29 11:26:48,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +49: [2023-04-29 11:26:48,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +27: [2023-04-29 11:26:48,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +49: [2023-04-29 11:26:48,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +52: [2023-04-29 11:26:48,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +21: [2023-04-29 11:26:48,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +54: [2023-04-29 11:26:48,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +41: [2023-04-29 11:26:48,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +41: [2023-04-29 11:26:48,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +35: [2023-04-29 11:26:48,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +31: [2023-04-29 11:26:48,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 6: [2023-04-29 11:26:48,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 6: [2023-04-29 11:26:48,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +49: [2023-04-29 11:26:48,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +27: [2023-04-29 11:26:48,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +27: [2023-04-29 11:26:48,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +39: [2023-04-29 11:26:48,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +39: [2023-04-29 11:26:48,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +30: [2023-04-29 11:26:48,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +30: [2023-04-29 11:26:48,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +28: [2023-04-29 11:26:48,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +28: [2023-04-29 11:26:48,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +33: [2023-04-29 11:26:48,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +33: [2023-04-29 11:26:48,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +28: [2023-04-29 11:26:48,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +28: [2023-04-29 11:26:48,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +22: [2023-04-29 11:26:48,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +22: [2023-04-29 11:26:48,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +30: [2023-04-29 11:26:48,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +54: [2023-04-29 11:26:48,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +35: [2023-04-29 11:26:48,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +33: [2023-04-29 11:26:48,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +33: [2023-04-29 11:26:48,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +52: [2023-04-29 11:26:48,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +52: [2023-04-29 11:26:48,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 3: [2023-04-29 11:26:48,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +21: [2023-04-29 11:26:48,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +21: [2023-04-29 11:26:48,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +47: [2023-04-29 11:26:48,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 6: [2023-04-29 11:26:48,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... + 6: [2023-04-29 11:26:48,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +54: [2023-04-29 11:26:48,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +45: [2023-04-29 11:26:48,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +22: [2023-04-29 11:26:48,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +28: [2023-04-29 11:26:48,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +33: [2023-04-29 11:26:48,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +33: [2023-04-29 11:26:48,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +35: [2023-04-29 11:26:48,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +35: [2023-04-29 11:26:48,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +39: [2023-04-29 11:26:48,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +39: [2023-04-29 11:26:48,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +11: [2023-04-29 11:26:48,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +24: [2023-04-29 11:26:48,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +24: [2023-04-29 11:26:48,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +24: [2023-04-29 11:26:48,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +24: [2023-04-29 11:26:48,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 11:26:48,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +35: [2023-04-29 11:26:48,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +39: [2023-04-29 11:26:48,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +39: [2023-04-29 11:26:48,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +22: [2023-04-29 11:26:48,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +22: [2023-04-29 11:26:48,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +55: [2023-04-29 11:26:48,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +33: [2023-04-29 11:26:48,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +33: [2023-04-29 11:26:48,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 3: [2023-04-29 11:26:48,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... + 3: [2023-04-29 11:26:48,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +59: [2023-04-29 11:26:48,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +59: [2023-04-29 11:26:48,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. + 6: [2023-04-29 11:26:48,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +30: [2023-04-29 11:26:48,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +20: [2023-04-29 11:26:48,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +23: [2023-04-29 11:26:48,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +20: [2023-04-29 11:26:48,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +20: [2023-04-29 11:26:48,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +23: [2023-04-29 11:26:48,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +23: [2023-04-29 11:26:48,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +20: [2023-04-29 11:26:48,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_15-model_01-model_states.pt. +54: [2023-04-29 11:26:48,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +23: [2023-04-29 11:26:48,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +11: [2023-04-29 11:26:48,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +11: [2023-04-29 11:26:48,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +13: [2023-04-29 11:26:48,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +52: [2023-04-29 11:26:48,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +13: [2023-04-29 11:26:48,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +13: [2023-04-29 11:26:48,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +13: [2023-04-29 11:26:48,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +35: [2023-04-29 11:26:48,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +54: [2023-04-29 11:26:48,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 6: [2023-04-29 11:26:48,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +40: [2023-04-29 11:26:48,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +40: [2023-04-29 11:26:48,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +35: [2023-04-29 11:26:48,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +24: [2023-04-29 11:26:48,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +24: [2023-04-29 11:26:48,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +24: [2023-04-29 11:26:48,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +24: [2023-04-29 11:26:48,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +54: [2023-04-29 11:26:48,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +32: [2023-04-29 11:26:48,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +15: [2023-04-29 11:26:48,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +15: [2023-04-29 11:26:48,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +40: [2023-04-29 11:26:48,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +55: [2023-04-29 11:26:48,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +40: [2023-04-29 11:26:48,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +44: [2023-04-29 11:26:48,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +44: [2023-04-29 11:26:48,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +55: [2023-04-29 11:26:48,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +59: [2023-04-29 11:26:48,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +59: [2023-04-29 11:26:48,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +39: [2023-04-29 11:26:48,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +39: [2023-04-29 11:26:48,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +30: [2023-04-29 11:26:48,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +25: [2023-04-29 11:26:48,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +25: [2023-04-29 11:26:48,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +25: [2023-04-29 11:26:48,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +23: [2023-04-29 11:26:48,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +25: [2023-04-29 11:26:48,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +23: [2023-04-29 11:26:48,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 6: [2023-04-29 11:26:48,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +55: [2023-04-29 11:26:48,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 5: [2023-04-29 11:26:48,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 5: [2023-04-29 11:26:48,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +45: [2023-04-29 11:26:48,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +44: [2023-04-29 11:26:48,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +52: [2023-04-29 11:26:48,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +15: [2023-04-29 11:26:48,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +15: [2023-04-29 11:26:48,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +48: [2023-04-29 11:26:48,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +48: [2023-04-29 11:26:48,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +48: [2023-04-29 11:26:48,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. + 5: [2023-04-29 11:26:48,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +44: [2023-04-29 11:26:48,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. + 5: [2023-04-29 11:26:48,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +48: [2023-04-29 11:26:48,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +23: [2023-04-29 11:26:48,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +54: [2023-04-29 11:26:48,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... + 1: [2023-04-29 11:26:48,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +32: [2023-04-29 11:26:48,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +32: [2023-04-29 11:26:48,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 6: [2023-04-29 11:26:48,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +23: [2023-04-29 11:26:48,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +45: [2023-04-29 11:26:48,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +60: [2023-04-29 11:26:48,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +22: [2023-04-29 11:26:48,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +47: [2023-04-29 11:26:48,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +22: [2023-04-29 11:26:48,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +62: [2023-04-29 11:26:48,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 0: [2023-04-29 11:26:48,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +54: [2023-04-29 11:26:48,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 0: [2023-04-29 11:26:48,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +50: [2023-04-29 11:26:48,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +38: [2023-04-29 11:26:48,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +38: [2023-04-29 11:26:48,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +54: [2023-04-29 11:26:48,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +38: [2023-04-29 11:26:48,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +38: [2023-04-29 11:26:48,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +47: [2023-04-29 11:26:48,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +47: [2023-04-29 11:26:48,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +52: [2023-04-29 11:26:48,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +56: [2023-04-29 11:26:48,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +56: [2023-04-29 11:26:48,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +60: [2023-04-29 11:26:48,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +18: [2023-04-29 11:26:48,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +18: [2023-04-29 11:26:48,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +18: [2023-04-29 11:26:48,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +18: [2023-04-29 11:26:48,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +50: [2023-04-29 11:26:48,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +50: [2023-04-29 11:26:48,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +50: [2023-04-29 11:26:48,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +62: [2023-04-29 11:26:48,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 0: [2023-04-29 11:26:48,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +62: [2023-04-29 11:26:48,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +60: [2023-04-29 11:26:48,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +60: [2023-04-29 11:26:48,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +56: [2023-04-29 11:26:48,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +62: [2023-04-29 11:26:48,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +62: [2023-04-29 11:26:48,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +56: [2023-04-29 11:26:48,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +54: [2023-04-29 11:26:48,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +54: [2023-04-29 11:26:48,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +32: [2023-04-29 11:26:48,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 5: [2023-04-29 11:26:48,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +12: [2023-04-29 11:26:48,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +12: [2023-04-29 11:26:48,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +12: [2023-04-29 11:26:48,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +12: [2023-04-29 11:26:48,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +12: [2023-04-29 11:26:48,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +62: [2023-04-29 11:26:48,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +29: [2023-04-29 11:26:48,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +29: [2023-04-29 11:26:48,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +29: [2023-04-29 11:26:48,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +60: [2023-04-29 11:26:48,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +29: [2023-04-29 11:26:48,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +60: [2023-04-29 11:26:48,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +62: [2023-04-29 11:26:48,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +59: [2023-04-29 11:26:48,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +59: [2023-04-29 11:26:48,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +62: [2023-04-29 11:26:48,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +18: [2023-04-29 11:26:48,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +18: [2023-04-29 11:26:48,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 5: [2023-04-29 11:26:48,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +18: [2023-04-29 11:26:48,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +59: [2023-04-29 11:26:48,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +18: [2023-04-29 11:26:48,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +20: [2023-04-29 11:26:48,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +20: [2023-04-29 11:26:48,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +29: [2023-04-29 11:26:48,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +29: [2023-04-29 11:26:48,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +40: [2023-04-29 11:26:48,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +60: [2023-04-29 11:26:48,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 11:26:48,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +29: [2023-04-29 11:26:48,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +20: [2023-04-29 11:26:48,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... +29: [2023-04-29 11:26:48,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +40: [2023-04-29 11:26:48,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +15: [2023-04-29 11:26:48,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +15: [2023-04-29 11:26:48,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +40: [2023-04-29 11:26:48,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +20: [2023-04-29 11:26:48,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt... + 2: [2023-04-29 11:26:48,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +62: [2023-04-29 11:26:48,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +59: [2023-04-29 11:26:48,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 1: [2023-04-29 11:26:48,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +44: [2023-04-29 11:26:48,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +44: [2023-04-29 11:26:48,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +60: [2023-04-29 11:26:48,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +44: [2023-04-29 11:26:48,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 3: [2023-04-29 11:26:48,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +48: [2023-04-29 11:26:48,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 3: [2023-04-29 11:26:48,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +44: [2023-04-29 11:26:48,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +48: [2023-04-29 11:26:48,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +48: [2023-04-29 11:26:48,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 2: [2023-04-29 11:26:48,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 2: [2023-04-29 11:26:48,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 2: [2023-04-29 11:26:48,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +15: [2023-04-29 11:26:48,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +33: [2023-04-29 11:26:48,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +15: [2023-04-29 11:26:48,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +21: [2023-04-29 11:26:48,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 2: [2023-04-29 11:26:48,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +48: [2023-04-29 11:26:48,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +62: [2023-04-29 11:26:48,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +21: [2023-04-29 11:26:48,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... + 3: [2023-04-29 11:26:48,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +56: [2023-04-29 11:26:48,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +33: [2023-04-29 11:26:48,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... + 1: [2023-04-29 11:26:48,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +49: [2023-04-29 11:26:48,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +49: [2023-04-29 11:26:48,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +27: [2023-04-29 11:26:48,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +34: [2023-04-29 11:26:48,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +34: [2023-04-29 11:26:48,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. + 3: [2023-04-29 11:26:48,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 2: [2023-04-29 11:26:48,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... + 2: [2023-04-29 11:26:48,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... + 2: [2023-04-29 11:26:48,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +56: [2023-04-29 11:26:48,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 3: [2023-04-29 11:26:48,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +38: [2023-04-29 11:26:48,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +56: [2023-04-29 11:26:48,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +33: [2023-04-29 11:26:48,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +34: [2023-04-29 11:26:48,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +34: [2023-04-29 11:26:48,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +62: [2023-04-29 11:26:48,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +62: [2023-04-29 11:26:48,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +41: [2023-04-29 11:26:48,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. + 1: [2023-04-29 11:26:48,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +41: [2023-04-29 11:26:48,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +41: [2023-04-29 11:26:48,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +41: [2023-04-29 11:26:48,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. + 1: [2023-04-29 11:26:48,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +31: [2023-04-29 11:26:48,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +31: [2023-04-29 11:26:48,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +31: [2023-04-29 11:26:48,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +27: [2023-04-29 11:26:48,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +31: [2023-04-29 11:26:48,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +27: [2023-04-29 11:26:48,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +38: [2023-04-29 11:26:48,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +38: [2023-04-29 11:26:48,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +49: [2023-04-29 11:26:48,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +49: [2023-04-29 11:26:48,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +27: [2023-04-29 11:26:48,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +31: [2023-04-29 11:26:48,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +55: [2023-04-29 11:26:48,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +38: [2023-04-29 11:26:48,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 5: [2023-04-29 11:26:48,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +11: [2023-04-29 11:26:48,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +27: [2023-04-29 11:26:48,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +33: [2023-04-29 11:26:48,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +53: [2023-04-29 11:26:48,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +53: [2023-04-29 11:26:48,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +53: [2023-04-29 11:26:48,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. + 2: [2023-04-29 11:26:48,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 2: [2023-04-29 11:26:48,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 2: [2023-04-29 11:26:48,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +27: [2023-04-29 11:26:48,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +56: [2023-04-29 11:26:48,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... + 2: [2023-04-29 11:26:48,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +53: [2023-04-29 11:26:48,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +45: [2023-04-29 11:26:48,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +45: [2023-04-29 11:26:48,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +45: [2023-04-29 11:26:48,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +45: [2023-04-29 11:26:48,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +49: [2023-04-29 11:26:48,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +31: [2023-04-29 11:26:48,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +31: [2023-04-29 11:26:48,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +31: [2023-04-29 11:26:48,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +49: [2023-04-29 11:26:48,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +55: [2023-04-29 11:26:48,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +31: [2023-04-29 11:26:48,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +31: [2023-04-29 11:26:48,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... + 5: [2023-04-29 11:26:48,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +33: [2023-04-29 11:26:48,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +11: [2023-04-29 11:26:48,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... + 2: [2023-04-29 11:26:48,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 2: [2023-04-29 11:26:48,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +24: [2023-04-29 11:26:48,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 2: [2023-04-29 11:26:48,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +52: [2023-04-29 11:26:48,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +31: [2023-04-29 11:26:48,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +31: [2023-04-29 11:26:48,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +61: [2023-04-29 11:26:48,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +61: [2023-04-29 11:26:48,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +49: [2023-04-29 11:26:48,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +49: [2023-04-29 11:26:48,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... + 2: [2023-04-29 11:26:48,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +25: [2023-04-29 11:26:48,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +25: [2023-04-29 11:26:48,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +62: [2023-04-29 11:26:48,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +61: [2023-04-29 11:26:48,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +61: [2023-04-29 11:26:48,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +52: [2023-04-29 11:26:48,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +27: [2023-04-29 11:26:48,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +31: [2023-04-29 11:26:48,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +52: [2023-04-29 11:26:48,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +21: [2023-04-29 11:26:48,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +21: [2023-04-29 11:26:48,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +32: [2023-04-29 11:26:48,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +55: [2023-04-29 11:26:48,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +52: [2023-04-29 11:26:48,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +23: [2023-04-29 11:26:48,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +24: [2023-04-29 11:26:48,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 11:26:48,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +33: [2023-04-29 11:26:48,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +22: [2023-04-29 11:26:48,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +22: [2023-04-29 11:26:48,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +33: [2023-04-29 11:26:48,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +33: [2023-04-29 11:26:48,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +52: [2023-04-29 11:26:48,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +13: [2023-04-29 11:26:48,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +25: [2023-04-29 11:26:48,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +12: [2023-04-29 11:26:48,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +12: [2023-04-29 11:26:48,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +12: [2023-04-29 11:26:48,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +12: [2023-04-29 11:26:48,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +25: [2023-04-29 11:26:48,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +25: [2023-04-29 11:26:48,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +31: [2023-04-29 11:26:48,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +31: [2023-04-29 11:26:48,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +25: [2023-04-29 11:26:48,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +24: [2023-04-29 11:26:48,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +24: [2023-04-29 11:26:48,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +52: [2023-04-29 11:26:48,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +55: [2023-04-29 11:26:48,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +27: [2023-04-29 11:26:48,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +62: [2023-04-29 11:26:48,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +23: [2023-04-29 11:26:48,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +52: [2023-04-29 11:26:48,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +52: [2023-04-29 11:26:48,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +23: [2023-04-29 11:26:48,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +22: [2023-04-29 11:26:48,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +32: [2023-04-29 11:26:48,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +31: [2023-04-29 11:26:48,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +21: [2023-04-29 11:26:48,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +21: [2023-04-29 11:26:48,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +34: [2023-04-29 11:26:48,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +34: [2023-04-29 11:26:48,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +33: [2023-04-29 11:26:48,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +33: [2023-04-29 11:26:48,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +22: [2023-04-29 11:26:48,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +13: [2023-04-29 11:26:48,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +25: [2023-04-29 11:26:48,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +13: [2023-04-29 11:26:48,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +13: [2023-04-29 11:26:48,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +25: [2023-04-29 11:26:48,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +25: [2023-04-29 11:26:48,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +21: [2023-04-29 11:26:48,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... + 9: [2023-04-29 11:26:48,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +11: [2023-04-29 11:26:48,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +62: [2023-04-29 11:26:48,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +62: [2023-04-29 11:26:48,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +55: [2023-04-29 11:26:48,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +41: [2023-04-29 11:26:48,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +55: [2023-04-29 11:26:48,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +13: [2023-04-29 11:26:48,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +41: [2023-04-29 11:26:48,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +53: [2023-04-29 11:26:48,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +12: [2023-04-29 11:26:48,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +50: [2023-04-29 11:26:48,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +50: [2023-04-29 11:26:48,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +41: [2023-04-29 11:26:48,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +12: [2023-04-29 11:26:48,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +13: [2023-04-29 11:26:48,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +22: [2023-04-29 11:26:48,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +34: [2023-04-29 11:26:48,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +13: [2023-04-29 11:26:48,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +53: [2023-04-29 11:26:48,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +59: [2023-04-29 11:26:48,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +53: [2023-04-29 11:26:48,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +25: [2023-04-29 11:26:48,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +33: [2023-04-29 11:26:48,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +41: [2023-04-29 11:26:48,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +25: [2023-04-29 11:26:48,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +53: [2023-04-29 11:26:48,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +25: [2023-04-29 11:26:48,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +42: [2023-04-29 11:26:48,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +42: [2023-04-29 11:26:48,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +42: [2023-04-29 11:26:48,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +11: [2023-04-29 11:26:48,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +25: [2023-04-29 11:26:48,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +42: [2023-04-29 11:26:48,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_36-model_01-model_states.pt. +11: [2023-04-29 11:26:48,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +45: [2023-04-29 11:26:48,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +50: [2023-04-29 11:26:48,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +50: [2023-04-29 11:26:48,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +34: [2023-04-29 11:26:48,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +45: [2023-04-29 11:26:48,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +11: [2023-04-29 11:26:48,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +55: [2023-04-29 11:26:48,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... + 5: [2023-04-29 11:26:48,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +13: [2023-04-29 11:26:48,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +22: [2023-04-29 11:26:48,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +59: [2023-04-29 11:26:48,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +57: [2023-04-29 11:26:48,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +57: [2023-04-29 11:26:48,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +57: [2023-04-29 11:26:48,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +29: [2023-04-29 11:26:48,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +57: [2023-04-29 11:26:48,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +50: [2023-04-29 11:26:48,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +50: [2023-04-29 11:26:48,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +55: [2023-04-29 11:26:48,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +23: [2023-04-29 11:26:48,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +32: [2023-04-29 11:26:48,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +32: [2023-04-29 11:26:48,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +33: [2023-04-29 11:26:48,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +12: [2023-04-29 11:26:48,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 5: [2023-04-29 11:26:48,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +61: [2023-04-29 11:26:48,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +25: [2023-04-29 11:26:48,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +24: [2023-04-29 11:26:48,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +25: [2023-04-29 11:26:48,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +25: [2023-04-29 11:26:48,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +50: [2023-04-29 11:26:48,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +50: [2023-04-29 11:26:48,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +61: [2023-04-29 11:26:48,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +33: [2023-04-29 11:26:48,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +11: [2023-04-29 11:26:48,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... + 5: [2023-04-29 11:26:48,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +12: [2023-04-29 11:26:48,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +45: [2023-04-29 11:26:48,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +45: [2023-04-29 11:26:48,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +22: [2023-04-29 11:26:48,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +61: [2023-04-29 11:26:48,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +61: [2023-04-29 11:26:48,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +59: [2023-04-29 11:26:48,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +59: [2023-04-29 11:26:48,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +24: [2023-04-29 11:26:48,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +32: [2023-04-29 11:26:48,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +32: [2023-04-29 11:26:48,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... + 5: [2023-04-29 11:26:48,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +32: [2023-04-29 11:26:48,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +11: [2023-04-29 11:26:48,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... + 5: [2023-04-29 11:26:48,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +22: [2023-04-29 11:26:48,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +23: [2023-04-29 11:26:48,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +18: [2023-04-29 11:26:48,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +18: [2023-04-29 11:26:48,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +24: [2023-04-29 11:26:48,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +29: [2023-04-29 11:26:48,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +63: [2023-04-29 11:26:48,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +63: [2023-04-29 11:26:48,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. + 8: [2023-04-29 11:26:48,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +63: [2023-04-29 11:26:48,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. + 8: [2023-04-29 11:26:48,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +33: [2023-04-29 11:26:48,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 11:26:48,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +59: [2023-04-29 11:26:48,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +59: [2023-04-29 11:26:48,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +36: [2023-04-29 11:26:48,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +36: [2023-04-29 11:26:48,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +23: [2023-04-29 11:26:48,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +20: [2023-04-29 11:26:48,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +59: [2023-04-29 11:26:48,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +29: [2023-04-29 11:26:48,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +29: [2023-04-29 11:26:48,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +32: [2023-04-29 11:26:48,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +24: [2023-04-29 11:26:48,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 5: [2023-04-29 11:26:48,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +20: [2023-04-29 11:26:48,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +23: [2023-04-29 11:26:48,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +36: [2023-04-29 11:26:48,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +44: [2023-04-29 11:26:48,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +44: [2023-04-29 11:26:48,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +37: [2023-04-29 11:26:48,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +37: [2023-04-29 11:26:48,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. + 8: [2023-04-29 11:26:48,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +44: [2023-04-29 11:26:48,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +20: [2023-04-29 11:26:48,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +36: [2023-04-29 11:26:48,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +20: [2023-04-29 11:26:48,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +20: [2023-04-29 11:26:48,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_00-model_states.pt. +44: [2023-04-29 11:26:48,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +59: [2023-04-29 11:26:48,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +18: [2023-04-29 11:26:48,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +20: [2023-04-29 11:26:48,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +37: [2023-04-29 11:26:48,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +37: [2023-04-29 11:26:48,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +18: [2023-04-29 11:26:48,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +44: [2023-04-29 11:26:48,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +44: [2023-04-29 11:26:48,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +51: [2023-04-29 11:26:48,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +51: [2023-04-29 11:26:48,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +44: [2023-04-29 11:26:48,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +51: [2023-04-29 11:26:48,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +51: [2023-04-29 11:26:48,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +29: [2023-04-29 11:26:48,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +42: [2023-04-29 11:26:48,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +42: [2023-04-29 11:26:48,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +42: [2023-04-29 11:26:48,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +20: [2023-04-29 11:26:48,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +44: [2023-04-29 11:26:48,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +57: [2023-04-29 11:26:48,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +57: [2023-04-29 11:26:48,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +20: [2023-04-29 11:26:48,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt... +56: [2023-04-29 11:26:48,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +57: [2023-04-29 11:26:48,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +57: [2023-04-29 11:26:48,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +42: [2023-04-29 11:26:48,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt... +38: [2023-04-29 11:26:48,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +38: [2023-04-29 11:26:48,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +33: [2023-04-29 11:26:48,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 3: [2023-04-29 11:26:48,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +23: [2023-04-29 11:26:48,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +56: [2023-04-29 11:26:48,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +56: [2023-04-29 11:26:48,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... + 2: [2023-04-29 11:26:48,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +38: [2023-04-29 11:26:48,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +38: [2023-04-29 11:26:48,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +56: [2023-04-29 11:26:48,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +29: [2023-04-29 11:26:48,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +31: [2023-04-29 11:26:48,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +31: [2023-04-29 11:26:48,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +31: [2023-04-29 11:26:48,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +38: [2023-04-29 11:26:48,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +38: [2023-04-29 11:26:48,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 2: [2023-04-29 11:26:48,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +36: [2023-04-29 11:26:48,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +36: [2023-04-29 11:26:48,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +46: [2023-04-29 11:26:48,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +46: [2023-04-29 11:26:48,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +33: [2023-04-29 11:26:48,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +46: [2023-04-29 11:26:48,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +56: [2023-04-29 11:26:48,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +31: [2023-04-29 11:26:48,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +46: [2023-04-29 11:26:48,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +25: [2023-04-29 11:26:48,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +28: [2023-04-29 11:26:48,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +36: [2023-04-29 11:26:48,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +28: [2023-04-29 11:26:48,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +28: [2023-04-29 11:26:48,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +63: [2023-04-29 11:26:48,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +26: [2023-04-29 11:26:48,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +28: [2023-04-29 11:26:48,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 2: [2023-04-29 11:26:48,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +26: [2023-04-29 11:26:48,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +26: [2023-04-29 11:26:48,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +29: [2023-04-29 11:26:48,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +63: [2023-04-29 11:26:48,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +63: [2023-04-29 11:26:48,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +36: [2023-04-29 11:26:48,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +26: [2023-04-29 11:26:48,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +56: [2023-04-29 11:26:48,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +29: [2023-04-29 11:26:48,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 2: [2023-04-29 11:26:48,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +38: [2023-04-29 11:26:48,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +18: [2023-04-29 11:26:48,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 3: [2023-04-29 11:26:48,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +38: [2023-04-29 11:26:48,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +18: [2023-04-29 11:26:48,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +56: [2023-04-29 11:26:48,564] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +63: [2023-04-29 11:26:48,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 3: [2023-04-29 11:26:48,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +28: [2023-04-29 11:26:48,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +28: [2023-04-29 11:26:48,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +26: [2023-04-29 11:26:48,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +26: [2023-04-29 11:26:48,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +37: [2023-04-29 11:26:48,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +37: [2023-04-29 11:26:48,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +26: [2023-04-29 11:26:48,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 7: [2023-04-29 11:26:48,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 7: [2023-04-29 11:26:48,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +26: [2023-04-29 11:26:48,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +37: [2023-04-29 11:26:48,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +28: [2023-04-29 11:26:48,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +51: [2023-04-29 11:26:48,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +27: [2023-04-29 11:26:48,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +27: [2023-04-29 11:26:48,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +27: [2023-04-29 11:26:48,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 7: [2023-04-29 11:26:48,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +27: [2023-04-29 11:26:48,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +25: [2023-04-29 11:26:48,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +51: [2023-04-29 11:26:48,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +28: [2023-04-29 11:26:48,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 7: [2023-04-29 11:26:48,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +41: [2023-04-29 11:26:48,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +56: [2023-04-29 11:26:48,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +51: [2023-04-29 11:26:48,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +37: [2023-04-29 11:26:48,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +51: [2023-04-29 11:26:48,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +27: [2023-04-29 11:26:48,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +27: [2023-04-29 11:26:48,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +27: [2023-04-29 11:26:48,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +27: [2023-04-29 11:26:48,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 7: [2023-04-29 11:26:48,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 7: [2023-04-29 11:26:48,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 2: [2023-04-29 11:26:48,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +41: [2023-04-29 11:26:48,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +25: [2023-04-29 11:26:48,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 7: [2023-04-29 11:26:48,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +58: [2023-04-29 11:26:48,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +58: [2023-04-29 11:26:48,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +58: [2023-04-29 11:26:48,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +58: [2023-04-29 11:26:48,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +19: [2023-04-29 11:26:48,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +19: [2023-04-29 11:26:48,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +19: [2023-04-29 11:26:48,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +25: [2023-04-29 11:26:48,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +18: [2023-04-29 11:26:48,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +19: [2023-04-29 11:26:48,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 7: [2023-04-29 11:26:48,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +47: [2023-04-29 11:26:48,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +47: [2023-04-29 11:26:48,579] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. + 9: [2023-04-29 11:26:48,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +41: [2023-04-29 11:26:48,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +47: [2023-04-29 11:26:48,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +47: [2023-04-29 11:26:48,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +19: [2023-04-29 11:26:48,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +31: [2023-04-29 11:26:48,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +19: [2023-04-29 11:26:48,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +45: [2023-04-29 11:26:48,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +19: [2023-04-29 11:26:48,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +19: [2023-04-29 11:26:48,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 3: [2023-04-29 11:26:48,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +46: [2023-04-29 11:26:48,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +46: [2023-04-29 11:26:48,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +31: [2023-04-29 11:26:48,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +31: [2023-04-29 11:26:48,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +41: [2023-04-29 11:26:48,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +41: [2023-04-29 11:26:48,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +31: [2023-04-29 11:26:48,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +41: [2023-04-29 11:26:48,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +45: [2023-04-29 11:26:48,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +18: [2023-04-29 11:26:48,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +46: [2023-04-29 11:26:48,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 2: [2023-04-29 11:26:48,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 2: [2023-04-29 11:26:48,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +25: [2023-04-29 11:26:48,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +45: [2023-04-29 11:26:48,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 2: [2023-04-29 11:26:48,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +46: [2023-04-29 11:26:48,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +45: [2023-04-29 11:26:48,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +41: [2023-04-29 11:26:48,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +41: [2023-04-29 11:26:48,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +45: [2023-04-29 11:26:48,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +25: [2023-04-29 11:26:48,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +45: [2023-04-29 11:26:48,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +17: [2023-04-29 11:26:48,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +17: [2023-04-29 11:26:48,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +17: [2023-04-29 11:26:48,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +20: [2023-04-29 11:26:48,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +20: [2023-04-29 11:26:48,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +20: [2023-04-29 11:26:48,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +20: [2023-04-29 11:26:48,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +17: [2023-04-29 11:26:48,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +45: [2023-04-29 11:26:48,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +42: [2023-04-29 11:26:48,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +42: [2023-04-29 11:26:48,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +20: [2023-04-29 11:26:48,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +17: [2023-04-29 11:26:48,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +20: [2023-04-29 11:26:48,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +17: [2023-04-29 11:26:48,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +10: [2023-04-29 11:26:48,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 11:26:48,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 11:26:48,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +17: [2023-04-29 11:26:48,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +10: [2023-04-29 11:26:48,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +58: [2023-04-29 11:26:48,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +45: [2023-04-29 11:26:48,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +20: [2023-04-29 11:26:48,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +20: [2023-04-29 11:26:48,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +17: [2023-04-29 11:26:48,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +25: [2023-04-29 11:26:48,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +42: [2023-04-29 11:26:48,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +42: [2023-04-29 11:26:48,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... + 9: [2023-04-29 11:26:48,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +58: [2023-04-29 11:26:48,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +58: [2023-04-29 11:26:48,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +58: [2023-04-29 11:26:48,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +57: [2023-04-29 11:26:48,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +47: [2023-04-29 11:26:48,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +47: [2023-04-29 11:26:48,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +10: [2023-04-29 11:26:48,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +10: [2023-04-29 11:26:48,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +35: [2023-04-29 11:26:48,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +35: [2023-04-29 11:26:48,608] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +25: [2023-04-29 11:26:48,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +57: [2023-04-29 11:26:48,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +10: [2023-04-29 11:26:48,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 8: [2023-04-29 11:26:48,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +10: [2023-04-29 11:26:48,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +35: [2023-04-29 11:26:48,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +57: [2023-04-29 11:26:48,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +42: [2023-04-29 11:26:48,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +35: [2023-04-29 11:26:48,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. + 9: [2023-04-29 11:26:48,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +42: [2023-04-29 11:26:48,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_00-model_states.pt. +47: [2023-04-29 11:26:48,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +57: [2023-04-29 11:26:48,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +47: [2023-04-29 11:26:48,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +57: [2023-04-29 11:26:48,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +42: [2023-04-29 11:26:48,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... +57: [2023-04-29 11:26:48,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +57: [2023-04-29 11:26:48,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +42: [2023-04-29 11:26:48,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt... + 9: [2023-04-29 11:26:48,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +16: [2023-04-29 11:26:48,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +16: [2023-04-29 11:26:48,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 8: [2023-04-29 11:26:48,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +16: [2023-04-29 11:26:48,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +16: [2023-04-29 11:26:48,624] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +57: [2023-04-29 11:26:48,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +26: [2023-04-29 11:26:48,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +63: [2023-04-29 11:26:48,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +63: [2023-04-29 11:26:48,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +16: [2023-04-29 11:26:48,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +11: [2023-04-29 11:26:48,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +11: [2023-04-29 11:26:48,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +11: [2023-04-29 11:26:48,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +11: [2023-04-29 11:26:48,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +63: [2023-04-29 11:26:48,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +26: [2023-04-29 11:26:48,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +39: [2023-04-29 11:26:48,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +39: [2023-04-29 11:26:48,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +39: [2023-04-29 11:26:48,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +39: [2023-04-29 11:26:48,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +63: [2023-04-29 11:26:48,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +16: [2023-04-29 11:26:48,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +51: [2023-04-29 11:26:48,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +16: [2023-04-29 11:26:48,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +16: [2023-04-29 11:26:48,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +11: [2023-04-29 11:26:48,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +63: [2023-04-29 11:26:48,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +63: [2023-04-29 11:26:48,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +28: [2023-04-29 11:26:48,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +13: [2023-04-29 11:26:48,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +13: [2023-04-29 11:26:48,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 7: [2023-04-29 11:26:48,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +13: [2023-04-29 11:26:48,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +11: [2023-04-29 11:26:48,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +13: [2023-04-29 11:26:48,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +51: [2023-04-29 11:26:48,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +51: [2023-04-29 11:26:48,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 11:26:48,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +28: [2023-04-29 11:26:48,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +11: [2023-04-29 11:26:48,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +11: [2023-04-29 11:26:48,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +27: [2023-04-29 11:26:48,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +51: [2023-04-29 11:26:48,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +35: [2023-04-29 11:26:48,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +35: [2023-04-29 11:26:48,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +35: [2023-04-29 11:26:48,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +63: [2023-04-29 11:26:48,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +13: [2023-04-29 11:26:48,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +26: [2023-04-29 11:26:48,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +26: [2023-04-29 11:26:48,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +28: [2023-04-29 11:26:48,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +28: [2023-04-29 11:26:48,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +51: [2023-04-29 11:26:48,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +51: [2023-04-29 11:26:48,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +19: [2023-04-29 11:26:48,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +13: [2023-04-29 11:26:48,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +51: [2023-04-29 11:26:48,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +13: [2023-04-29 11:26:48,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +13: [2023-04-29 11:26:48,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 8: [2023-04-29 11:26:48,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 8: [2023-04-29 11:26:48,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 7: [2023-04-29 11:26:48,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 7: [2023-04-29 11:26:48,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +35: [2023-04-29 11:26:48,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +51: [2023-04-29 11:26:48,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... + 8: [2023-04-29 11:26:48,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +27: [2023-04-29 11:26:48,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +27: [2023-04-29 11:26:48,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +27: [2023-04-29 11:26:48,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 7: [2023-04-29 11:26:48,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +19: [2023-04-29 11:26:48,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +38: [2023-04-29 11:26:48,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +38: [2023-04-29 11:26:48,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +38: [2023-04-29 11:26:48,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +38: [2023-04-29 11:26:48,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +19: [2023-04-29 11:26:48,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +38: [2023-04-29 11:26:48,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +38: [2023-04-29 11:26:48,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +38: [2023-04-29 11:26:48,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +19: [2023-04-29 11:26:48,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +26: [2023-04-29 11:26:48,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +58: [2023-04-29 11:26:48,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +58: [2023-04-29 11:26:48,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +58: [2023-04-29 11:26:48,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +38: [2023-04-29 11:26:48,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +14: [2023-04-29 11:26:48,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +14: [2023-04-29 11:26:48,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +17: [2023-04-29 11:26:48,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +22: [2023-04-29 11:26:48,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +22: [2023-04-29 11:26:48,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +58: [2023-04-29 11:26:48,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 7: [2023-04-29 11:26:48,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +22: [2023-04-29 11:26:48,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +39: [2023-04-29 11:26:48,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +39: [2023-04-29 11:26:48,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +39: [2023-04-29 11:26:48,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +26: [2023-04-29 11:26:48,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +28: [2023-04-29 11:26:48,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +39: [2023-04-29 11:26:48,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +22: [2023-04-29 11:26:48,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +14: [2023-04-29 11:26:48,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +14: [2023-04-29 11:26:48,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +28: [2023-04-29 11:26:48,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +27: [2023-04-29 11:26:48,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +20: [2023-04-29 11:26:48,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +58: [2023-04-29 11:26:48,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +58: [2023-04-29 11:26:48,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +22: [2023-04-29 11:26:48,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +22: [2023-04-29 11:26:48,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +58: [2023-04-29 11:26:48,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +22: [2023-04-29 11:26:48,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +58: [2023-04-29 11:26:48,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +14: [2023-04-29 11:26:48,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +58: [2023-04-29 11:26:48,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +14: [2023-04-29 11:26:48,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +20: [2023-04-29 11:26:48,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +14: [2023-04-29 11:26:48,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +10: [2023-04-29 11:26:48,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +17: [2023-04-29 11:26:48,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +26: [2023-04-29 11:26:48,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +20: [2023-04-29 11:26:48,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +20: [2023-04-29 11:26:48,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +17: [2023-04-29 11:26:48,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +22: [2023-04-29 11:26:48,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +28: [2023-04-29 11:26:48,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +58: [2023-04-29 11:26:48,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +14: [2023-04-29 11:26:48,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +10: [2023-04-29 11:26:48,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +26: [2023-04-29 11:26:48,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +28: [2023-04-29 11:26:48,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +27: [2023-04-29 11:26:48,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +19: [2023-04-29 11:26:48,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 7: [2023-04-29 11:26:48,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 7: [2023-04-29 11:26:48,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +27: [2023-04-29 11:26:48,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +27: [2023-04-29 11:26:48,675] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +10: [2023-04-29 11:26:48,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +19: [2023-04-29 11:26:48,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +10: [2023-04-29 11:26:48,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +58: [2023-04-29 11:26:48,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 7: [2023-04-29 11:26:48,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +19: [2023-04-29 11:26:48,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +49: [2023-04-29 11:26:48,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +49: [2023-04-29 11:26:48,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +49: [2023-04-29 11:26:48,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +49: [2023-04-29 11:26:48,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +17: [2023-04-29 11:26:48,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +58: [2023-04-29 11:26:48,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +17: [2023-04-29 11:26:48,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +19: [2023-04-29 11:26:48,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +58: [2023-04-29 11:26:48,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +58: [2023-04-29 11:26:48,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +35: [2023-04-29 11:26:48,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +16: [2023-04-29 11:26:48,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 11:26:48,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +58: [2023-04-29 11:26:48,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +20: [2023-04-29 11:26:48,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +35: [2023-04-29 11:26:48,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +16: [2023-04-29 11:26:48,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +11: [2023-04-29 11:26:48,694] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +20: [2023-04-29 11:26:48,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +17: [2023-04-29 11:26:48,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +58: [2023-04-29 11:26:48,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +55: [2023-04-29 11:26:48,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +55: [2023-04-29 11:26:48,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +11: [2023-04-29 11:26:48,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 11:26:48,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 11:26:48,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +17: [2023-04-29 11:26:48,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +55: [2023-04-29 11:26:48,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +55: [2023-04-29 11:26:48,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +16: [2023-04-29 11:26:48,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +20: [2023-04-29 11:26:48,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +20: [2023-04-29 11:26:48,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +35: [2023-04-29 11:26:48,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +16: [2023-04-29 11:26:48,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +35: [2023-04-29 11:26:48,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +48: [2023-04-29 11:26:48,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +48: [2023-04-29 11:26:48,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +48: [2023-04-29 11:26:48,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +48: [2023-04-29 11:26:48,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +48: [2023-04-29 11:26:48,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +48: [2023-04-29 11:26:48,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +48: [2023-04-29 11:26:48,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +48: [2023-04-29 11:26:48,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +49: [2023-04-29 11:26:48,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +49: [2023-04-29 11:26:48,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 5: [2023-04-29 11:26:48,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 5: [2023-04-29 11:26:48,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +49: [2023-04-29 11:26:48,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +49: [2023-04-29 11:26:48,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +13: [2023-04-29 11:26:48,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +10: [2023-04-29 11:26:48,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +17: [2023-04-29 11:26:48,710] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +48: [2023-04-29 11:26:48,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +10: [2023-04-29 11:26:48,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +48: [2023-04-29 11:26:48,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 5: [2023-04-29 11:26:48,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +48: [2023-04-29 11:26:48,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... + 5: [2023-04-29 11:26:48,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +35: [2023-04-29 11:26:48,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +11: [2023-04-29 11:26:48,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +11: [2023-04-29 11:26:48,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +48: [2023-04-29 11:26:48,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +48: [2023-04-29 11:26:48,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +48: [2023-04-29 11:26:48,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +48: [2023-04-29 11:26:48,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +48: [2023-04-29 11:26:48,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +52: [2023-04-29 11:26:48,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +52: [2023-04-29 11:26:48,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +16: [2023-04-29 11:26:48,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 11:26:48,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +11: [2023-04-29 11:26:48,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +52: [2023-04-29 11:26:48,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +35: [2023-04-29 11:26:48,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +52: [2023-04-29 11:26:48,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +35: [2023-04-29 11:26:48,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +16: [2023-04-29 11:26:48,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 11:26:48,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +32: [2023-04-29 11:26:48,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +32: [2023-04-29 11:26:48,722] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +55: [2023-04-29 11:26:48,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +35: [2023-04-29 11:26:48,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +13: [2023-04-29 11:26:48,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +39: [2023-04-29 11:26:48,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +39: [2023-04-29 11:26:48,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +56: [2023-04-29 11:26:48,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +56: [2023-04-29 11:26:48,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +59: [2023-04-29 11:26:48,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +59: [2023-04-29 11:26:48,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +59: [2023-04-29 11:26:48,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +59: [2023-04-29 11:26:48,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +38: [2023-04-29 11:26:48,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +55: [2023-04-29 11:26:48,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +22: [2023-04-29 11:26:48,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +32: [2023-04-29 11:26:48,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +32: [2023-04-29 11:26:48,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +38: [2023-04-29 11:26:48,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +56: [2023-04-29 11:26:48,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +38: [2023-04-29 11:26:48,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +56: [2023-04-29 11:26:48,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +14: [2023-04-29 11:26:48,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +22: [2023-04-29 11:26:48,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +55: [2023-04-29 11:26:48,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +11: [2023-04-29 11:26:48,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +16: [2023-04-29 11:26:48,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +39: [2023-04-29 11:26:48,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +39: [2023-04-29 11:26:48,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +44: [2023-04-29 11:26:48,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +44: [2023-04-29 11:26:48,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +38: [2023-04-29 11:26:48,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +55: [2023-04-29 11:26:48,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +44: [2023-04-29 11:26:48,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +14: [2023-04-29 11:26:48,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +44: [2023-04-29 11:26:48,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +39: [2023-04-29 11:26:48,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +13: [2023-04-29 11:26:48,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +14: [2023-04-29 11:26:48,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +39: [2023-04-29 11:26:48,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +16: [2023-04-29 11:26:48,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +58: [2023-04-29 11:26:48,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +58: [2023-04-29 11:26:48,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +50: [2023-04-29 11:26:48,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +50: [2023-04-29 11:26:48,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +50: [2023-04-29 11:26:48,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +50: [2023-04-29 11:26:48,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +14: [2023-04-29 11:26:48,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +39: [2023-04-29 11:26:48,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +58: [2023-04-29 11:26:48,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +52: [2023-04-29 11:26:48,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +52: [2023-04-29 11:26:48,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +58: [2023-04-29 11:26:48,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 11:26:48,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +52: [2023-04-29 11:26:48,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +22: [2023-04-29 11:26:48,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +22: [2023-04-29 11:26:48,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +13: [2023-04-29 11:26:48,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +52: [2023-04-29 11:26:48,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +11: [2023-04-29 11:26:48,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +11: [2023-04-29 11:26:48,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 4: [2023-04-29 11:26:48,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +13: [2023-04-29 11:26:48,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +32: [2023-04-29 11:26:48,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +59: [2023-04-29 11:26:48,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +32: [2023-04-29 11:26:48,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 4: [2023-04-29 11:26:48,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +59: [2023-04-29 11:26:48,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +59: [2023-04-29 11:26:48,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +59: [2023-04-29 11:26:48,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +14: [2023-04-29 11:26:48,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +32: [2023-04-29 11:26:48,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +38: [2023-04-29 11:26:48,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +38: [2023-04-29 11:26:48,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +22: [2023-04-29 11:26:48,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 4: [2023-04-29 11:26:48,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 4: [2023-04-29 11:26:48,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +56: [2023-04-29 11:26:48,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +56: [2023-04-29 11:26:48,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... + 4: [2023-04-29 11:26:48,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +56: [2023-04-29 11:26:48,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +38: [2023-04-29 11:26:48,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +44: [2023-04-29 11:26:48,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +22: [2023-04-29 11:26:48,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +49: [2023-04-29 11:26:48,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +56: [2023-04-29 11:26:48,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +32: [2023-04-29 11:26:48,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +44: [2023-04-29 11:26:48,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +44: [2023-04-29 11:26:48,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +44: [2023-04-29 11:26:48,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +38: [2023-04-29 11:26:48,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +14: [2023-04-29 11:26:48,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +49: [2023-04-29 11:26:48,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +50: [2023-04-29 11:26:48,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +50: [2023-04-29 11:26:48,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +58: [2023-04-29 11:26:48,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +58: [2023-04-29 11:26:48,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +14: [2023-04-29 11:26:48,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +50: [2023-04-29 11:26:48,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +50: [2023-04-29 11:26:48,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +58: [2023-04-29 11:26:48,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +58: [2023-04-29 11:26:48,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +49: [2023-04-29 11:26:48,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +49: [2023-04-29 11:26:48,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +48: [2023-04-29 11:26:48,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +14: [2023-04-29 11:26:48,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 5: [2023-04-29 11:26:48,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +49: [2023-04-29 11:26:48,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +22: [2023-04-29 11:26:48,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +49: [2023-04-29 11:26:48,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +49: [2023-04-29 11:26:48,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +43: [2023-04-29 11:26:48,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +43: [2023-04-29 11:26:48,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +43: [2023-04-29 11:26:48,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +22: [2023-04-29 11:26:48,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +43: [2023-04-29 11:26:48,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +60: [2023-04-29 11:26:48,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +60: [2023-04-29 11:26:48,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +60: [2023-04-29 11:26:48,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +48: [2023-04-29 11:26:48,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +60: [2023-04-29 11:26:48,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +49: [2023-04-29 11:26:48,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... + 0: [2023-04-29 11:26:48,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 0: [2023-04-29 11:26:48,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 0: [2023-04-29 11:26:48,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 0: [2023-04-29 11:26:48,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +55: [2023-04-29 11:26:48,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 0: [2023-04-29 11:26:48,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +48: [2023-04-29 11:26:48,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +55: [2023-04-29 11:26:48,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +30: [2023-04-29 11:26:48,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +30: [2023-04-29 11:26:48,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +30: [2023-04-29 11:26:48,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +30: [2023-04-29 11:26:48,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +54: [2023-04-29 11:26:48,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +54: [2023-04-29 11:26:48,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +54: [2023-04-29 11:26:48,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +54: [2023-04-29 11:26:48,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +48: [2023-04-29 11:26:48,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +41: [2023-04-29 11:26:48,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +41: [2023-04-29 11:26:48,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +41: [2023-04-29 11:26:48,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +42: [2023-04-29 11:26:48,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +41: [2023-04-29 11:26:48,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +42: [2023-04-29 11:26:48,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +42: [2023-04-29 11:26:48,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +42: [2023-04-29 11:26:48,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_37-model_01-model_states.pt. +30: [2023-04-29 11:26:48,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +30: [2023-04-29 11:26:48,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +45: [2023-04-29 11:26:48,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +45: [2023-04-29 11:26:48,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +45: [2023-04-29 11:26:48,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +30: [2023-04-29 11:26:48,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +45: [2023-04-29 11:26:48,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +30: [2023-04-29 11:26:48,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +55: [2023-04-29 11:26:48,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +62: [2023-04-29 11:26:48,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +62: [2023-04-29 11:26:48,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +55: [2023-04-29 11:26:48,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +15: [2023-04-29 11:26:48,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +15: [2023-04-29 11:26:48,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +15: [2023-04-29 11:26:48,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +38: [2023-04-29 11:26:48,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +38: [2023-04-29 11:26:48,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +38: [2023-04-29 11:26:48,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +15: [2023-04-29 11:26:48,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +38: [2023-04-29 11:26:48,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +62: [2023-04-29 11:26:48,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +62: [2023-04-29 11:26:48,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. + 1: [2023-04-29 11:26:48,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +55: [2023-04-29 11:26:48,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +48: [2023-04-29 11:26:48,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +55: [2023-04-29 11:26:48,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +15: [2023-04-29 11:26:48,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +15: [2023-04-29 11:26:48,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +15: [2023-04-29 11:26:48,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +15: [2023-04-29 11:26:48,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +55: [2023-04-29 11:26:48,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 5: [2023-04-29 11:26:48,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 5: [2023-04-29 11:26:48,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +60: [2023-04-29 11:26:48,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +60: [2023-04-29 11:26:48,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 1: [2023-04-29 11:26:48,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 1: [2023-04-29 11:26:48,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 6: [2023-04-29 11:26:48,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 6: [2023-04-29 11:26:48,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 6: [2023-04-29 11:26:48,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 6: [2023-04-29 11:26:48,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +60: [2023-04-29 11:26:48,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 11:26:48,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +60: [2023-04-29 11:26:48,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 11:26:48,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 11:26:48,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 11:26:48,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +55: [2023-04-29 11:26:48,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +48: [2023-04-29 11:26:48,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 6: [2023-04-29 11:26:48,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 6: [2023-04-29 11:26:48,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 6: [2023-04-29 11:26:48,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 4: [2023-04-29 11:26:48,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 6: [2023-04-29 11:26:48,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 5: [2023-04-29 11:26:48,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +59: [2023-04-29 11:26:48,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +59: [2023-04-29 11:26:48,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +54: [2023-04-29 11:26:48,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +54: [2023-04-29 11:26:48,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +56: [2023-04-29 11:26:48,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +41: [2023-04-29 11:26:48,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +48: [2023-04-29 11:26:48,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 5: [2023-04-29 11:26:48,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +57: [2023-04-29 11:26:48,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +57: [2023-04-29 11:26:48,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +57: [2023-04-29 11:26:48,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +57: [2023-04-29 11:26:48,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +48: [2023-04-29 11:26:48,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 11:26:48,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +54: [2023-04-29 11:26:48,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +54: [2023-04-29 11:26:48,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +41: [2023-04-29 11:26:48,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +45: [2023-04-29 11:26:48,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +42: [2023-04-29 11:26:48,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +41: [2023-04-29 11:26:48,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +42: [2023-04-29 11:26:48,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +42: [2023-04-29 11:26:48,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt... +56: [2023-04-29 11:26:48,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +59: [2023-04-29 11:26:48,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +59: [2023-04-29 11:26:48,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +59: [2023-04-29 11:26:48,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +59: [2023-04-29 11:26:48,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +41: [2023-04-29 11:26:48,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +56: [2023-04-29 11:26:48,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +32: [2023-04-29 11:26:48,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +32: [2023-04-29 11:26:48,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +32: [2023-04-29 11:26:48,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +32: [2023-04-29 11:26:48,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +32: [2023-04-29 11:26:48,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +45: [2023-04-29 11:26:48,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +45: [2023-04-29 11:26:48,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +59: [2023-04-29 11:26:48,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +23: [2023-04-29 11:26:48,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +23: [2023-04-29 11:26:48,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +63: [2023-04-29 11:26:48,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +63: [2023-04-29 11:26:48,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +38: [2023-04-29 11:26:48,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +38: [2023-04-29 11:26:48,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +59: [2023-04-29 11:26:48,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +38: [2023-04-29 11:26:48,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 4: [2023-04-29 11:26:48,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +45: [2023-04-29 11:26:48,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +38: [2023-04-29 11:26:48,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +23: [2023-04-29 11:26:48,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +62: [2023-04-29 11:26:48,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +63: [2023-04-29 11:26:48,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +56: [2023-04-29 11:26:48,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +62: [2023-04-29 11:26:48,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +23: [2023-04-29 11:26:48,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +62: [2023-04-29 11:26:48,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +62: [2023-04-29 11:26:48,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +63: [2023-04-29 11:26:48,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +32: [2023-04-29 11:26:48,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +33: [2023-04-29 11:26:48,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +33: [2023-04-29 11:26:48,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +33: [2023-04-29 11:26:48,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +33: [2023-04-29 11:26:48,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +32: [2023-04-29 11:26:48,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +56: [2023-04-29 11:26:48,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +56: [2023-04-29 11:26:48,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +23: [2023-04-29 11:26:48,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +32: [2023-04-29 11:26:48,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +32: [2023-04-29 11:26:48,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +32: [2023-04-29 11:26:48,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +23: [2023-04-29 11:26:48,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +32: [2023-04-29 11:26:48,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +23: [2023-04-29 11:26:48,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +32: [2023-04-29 11:26:48,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +24: [2023-04-29 11:26:48,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +24: [2023-04-29 11:26:48,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +24: [2023-04-29 11:26:48,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +24: [2023-04-29 11:26:48,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +32: [2023-04-29 11:26:48,836] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +23: [2023-04-29 11:26:48,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +24: [2023-04-29 11:26:48,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +24: [2023-04-29 11:26:48,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +24: [2023-04-29 11:26:48,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +56: [2023-04-29 11:26:48,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +56: [2023-04-29 11:26:48,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +24: [2023-04-29 11:26:48,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +32: [2023-04-29 11:26:48,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +32: [2023-04-29 11:26:48,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +32: [2023-04-29 11:26:48,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +57: [2023-04-29 11:26:48,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +57: [2023-04-29 11:26:48,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +57: [2023-04-29 11:26:48,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +57: [2023-04-29 11:26:48,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +63: [2023-04-29 11:26:48,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +33: [2023-04-29 11:26:48,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 4: [2023-04-29 11:26:48,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +29: [2023-04-29 11:26:48,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +29: [2023-04-29 11:26:48,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +29: [2023-04-29 11:26:48,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +63: [2023-04-29 11:26:48,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +63: [2023-04-29 11:26:48,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +29: [2023-04-29 11:26:48,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 0: [2023-04-29 11:26:48,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +30: [2023-04-29 11:26:48,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +30: [2023-04-29 11:26:48,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +30: [2023-04-29 11:26:48,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +29: [2023-04-29 11:26:48,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +29: [2023-04-29 11:26:48,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +33: [2023-04-29 11:26:48,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +29: [2023-04-29 11:26:48,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +33: [2023-04-29 11:26:48,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +29: [2023-04-29 11:26:48,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +33: [2023-04-29 11:26:48,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +63: [2023-04-29 11:26:48,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +30: [2023-04-29 11:26:48,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 6: [2023-04-29 11:26:48,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +15: [2023-04-29 11:26:48,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +15: [2023-04-29 11:26:48,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +15: [2023-04-29 11:26:48,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +15: [2023-04-29 11:26:48,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +35: [2023-04-29 11:26:48,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +35: [2023-04-29 11:26:48,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +35: [2023-04-29 11:26:48,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +35: [2023-04-29 11:26:48,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. + 0: [2023-04-29 11:26:48,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 1: [2023-04-29 11:26:48,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 1: [2023-04-29 11:26:48,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 6: [2023-04-29 11:26:48,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 6: [2023-04-29 11:26:48,877] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +42: [2023-04-29 11:26:48,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. + 0: [2023-04-29 11:26:48,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 6: [2023-04-29 11:26:48,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +25: [2023-04-29 11:26:48,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +25: [2023-04-29 11:26:48,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 0: [2023-04-29 11:26:48,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 0: [2023-04-29 11:26:48,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +42: [2023-04-29 11:26:48,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +45: [2023-04-29 11:26:48,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +25: [2023-04-29 11:26:48,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +25: [2023-04-29 11:26:48,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +25: [2023-04-29 11:26:48,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +42: [2023-04-29 11:26:48,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +30: [2023-04-29 11:26:48,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +25: [2023-04-29 11:26:48,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +42: [2023-04-29 11:26:48,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +42: [2023-04-29 11:26:48,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_00-model_states.pt. +45: [2023-04-29 11:26:48,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +25: [2023-04-29 11:26:48,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +30: [2023-04-29 11:26:48,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +25: [2023-04-29 11:26:48,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +30: [2023-04-29 11:26:48,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +45: [2023-04-29 11:26:48,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +34: [2023-04-29 11:26:48,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +34: [2023-04-29 11:26:48,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +34: [2023-04-29 11:26:48,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +34: [2023-04-29 11:26:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +34: [2023-04-29 11:26:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +34: [2023-04-29 11:26:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +34: [2023-04-29 11:26:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +45: [2023-04-29 11:26:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +30: [2023-04-29 11:26:48,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 1: [2023-04-29 11:26:48,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +34: [2023-04-29 11:26:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +49: [2023-04-29 11:26:48,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +49: [2023-04-29 11:26:48,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +49: [2023-04-29 11:26:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +38: [2023-04-29 11:26:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +49: [2023-04-29 11:26:48,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 6: [2023-04-29 11:26:48,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +59: [2023-04-29 11:26:48,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +59: [2023-04-29 11:26:48,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +59: [2023-04-29 11:26:48,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +59: [2023-04-29 11:26:48,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +42: [2023-04-29 11:26:48,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +45: [2023-04-29 11:26:48,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +38: [2023-04-29 11:26:48,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +42: [2023-04-29 11:26:48,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +51: [2023-04-29 11:26:48,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +51: [2023-04-29 11:26:48,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +51: [2023-04-29 11:26:48,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +42: [2023-04-29 11:26:48,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt... +51: [2023-04-29 11:26:48,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +38: [2023-04-29 11:26:48,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +34: [2023-04-29 11:26:48,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +49: [2023-04-29 11:26:48,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +34: [2023-04-29 11:26:48,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +23: [2023-04-29 11:26:48,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +38: [2023-04-29 11:26:48,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +34: [2023-04-29 11:26:48,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +45: [2023-04-29 11:26:48,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +45: [2023-04-29 11:26:48,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +38: [2023-04-29 11:26:48,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +15: [2023-04-29 11:26:48,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +15: [2023-04-29 11:26:48,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +35: [2023-04-29 11:26:48,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +49: [2023-04-29 11:26:48,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +23: [2023-04-29 11:26:48,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +59: [2023-04-29 11:26:48,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +49: [2023-04-29 11:26:48,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +34: [2023-04-29 11:26:48,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +24: [2023-04-29 11:26:48,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +35: [2023-04-29 11:26:48,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +38: [2023-04-29 11:26:48,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +35: [2023-04-29 11:26:48,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +35: [2023-04-29 11:26:48,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +49: [2023-04-29 11:26:48,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +38: [2023-04-29 11:26:48,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +24: [2023-04-29 11:26:48,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +15: [2023-04-29 11:26:48,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +15: [2023-04-29 11:26:48,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +59: [2023-04-29 11:26:48,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +59: [2023-04-29 11:26:48,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +24: [2023-04-29 11:26:48,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 11:26:48,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +14: [2023-04-29 11:26:48,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +38: [2023-04-29 11:26:48,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +14: [2023-04-29 11:26:48,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +34: [2023-04-29 11:26:48,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... + 6: [2023-04-29 11:26:48,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +45: [2023-04-29 11:26:48,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +14: [2023-04-29 11:26:48,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 6: [2023-04-29 11:26:48,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +24: [2023-04-29 11:26:48,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +34: [2023-04-29 11:26:48,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +34: [2023-04-29 11:26:48,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +34: [2023-04-29 11:26:48,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 1: [2023-04-29 11:26:48,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 1: [2023-04-29 11:26:48,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 1: [2023-04-29 11:26:48,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +59: [2023-04-29 11:26:48,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +23: [2023-04-29 11:26:48,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +23: [2023-04-29 11:26:48,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +36: [2023-04-29 11:26:48,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +36: [2023-04-29 11:26:48,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +36: [2023-04-29 11:26:48,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +36: [2023-04-29 11:26:48,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +36: [2023-04-29 11:26:48,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +36: [2023-04-29 11:26:48,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +36: [2023-04-29 11:26:48,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +36: [2023-04-29 11:26:48,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +53: [2023-04-29 11:26:48,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +53: [2023-04-29 11:26:48,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +53: [2023-04-29 11:26:48,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +53: [2023-04-29 11:26:48,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +53: [2023-04-29 11:26:48,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +53: [2023-04-29 11:26:48,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +53: [2023-04-29 11:26:48,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +53: [2023-04-29 11:26:48,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 3: [2023-04-29 11:26:48,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 6: [2023-04-29 11:26:48,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +36: [2023-04-29 11:26:48,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +36: [2023-04-29 11:26:48,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +36: [2023-04-29 11:26:48,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +36: [2023-04-29 11:26:48,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +36: [2023-04-29 11:26:48,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... + 3: [2023-04-29 11:26:48,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +36: [2023-04-29 11:26:48,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +53: [2023-04-29 11:26:48,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 3: [2023-04-29 11:26:48,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +36: [2023-04-29 11:26:48,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +53: [2023-04-29 11:26:48,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +36: [2023-04-29 11:26:48,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +32: [2023-04-29 11:26:48,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +32: [2023-04-29 11:26:48,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +32: [2023-04-29 11:26:48,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +32: [2023-04-29 11:26:48,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +53: [2023-04-29 11:26:48,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +53: [2023-04-29 11:26:48,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +53: [2023-04-29 11:26:48,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +53: [2023-04-29 11:26:48,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +53: [2023-04-29 11:26:48,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +53: [2023-04-29 11:26:48,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +63: [2023-04-29 11:26:48,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +29: [2023-04-29 11:26:48,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +51: [2023-04-29 11:26:48,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +51: [2023-04-29 11:26:48,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +51: [2023-04-29 11:26:48,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +63: [2023-04-29 11:26:48,924] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 11:26:48,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +51: [2023-04-29 11:26:48,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +23: [2023-04-29 11:26:48,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +39: [2023-04-29 11:26:48,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +39: [2023-04-29 11:26:48,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +39: [2023-04-29 11:26:48,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +39: [2023-04-29 11:26:48,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +29: [2023-04-29 11:26:48,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +29: [2023-04-29 11:26:48,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +24: [2023-04-29 11:26:48,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +29: [2023-04-29 11:26:48,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +63: [2023-04-29 11:26:48,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 11:26:48,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +14: [2023-04-29 11:26:48,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +24: [2023-04-29 11:26:48,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +23: [2023-04-29 11:26:48,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +14: [2023-04-29 11:26:48,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +24: [2023-04-29 11:26:48,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +24: [2023-04-29 11:26:48,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 4: [2023-04-29 11:26:48,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 4: [2023-04-29 11:26:48,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 4: [2023-04-29 11:26:48,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 4: [2023-04-29 11:26:48,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +21: [2023-04-29 11:26:48,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 11:26:48,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 11:26:48,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 11:26:48,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 11:26:48,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +14: [2023-04-29 11:26:48,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +63: [2023-04-29 11:26:48,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +63: [2023-04-29 11:26:48,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +23: [2023-04-29 11:26:48,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +21: [2023-04-29 11:26:48,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +23: [2023-04-29 11:26:48,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +21: [2023-04-29 11:26:48,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +21: [2023-04-29 11:26:48,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +21: [2023-04-29 11:26:48,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +25: [2023-04-29 11:26:48,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +19: [2023-04-29 11:26:48,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +19: [2023-04-29 11:26:48,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +19: [2023-04-29 11:26:48,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +58: [2023-04-29 11:26:48,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +58: [2023-04-29 11:26:48,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +19: [2023-04-29 11:26:48,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 9: [2023-04-29 11:26:48,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +58: [2023-04-29 11:26:48,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +63: [2023-04-29 11:26:48,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +58: [2023-04-29 11:26:48,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. + 9: [2023-04-29 11:26:48,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +40: [2023-04-29 11:26:48,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 11:26:48,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 11:26:48,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 11:26:48,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 11:26:48,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 11:26:48,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 11:26:48,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 11:26:48,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 11:26:48,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +39: [2023-04-29 11:26:48,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +29: [2023-04-29 11:26:48,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +32: [2023-04-29 11:26:48,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +32: [2023-04-29 11:26:48,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +25: [2023-04-29 11:26:48,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +32: [2023-04-29 11:26:48,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +39: [2023-04-29 11:26:48,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +39: [2023-04-29 11:26:48,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +32: [2023-04-29 11:26:48,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +29: [2023-04-29 11:26:48,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +40: [2023-04-29 11:26:48,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +29: [2023-04-29 11:26:48,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +26: [2023-04-29 11:26:48,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +29: [2023-04-29 11:26:48,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +40: [2023-04-29 11:26:48,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +26: [2023-04-29 11:26:48,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +26: [2023-04-29 11:26:48,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +48: [2023-04-29 11:26:48,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +48: [2023-04-29 11:26:48,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +31: [2023-04-29 11:26:48,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +31: [2023-04-29 11:26:48,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +31: [2023-04-29 11:26:48,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +26: [2023-04-29 11:26:48,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +31: [2023-04-29 11:26:48,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +25: [2023-04-29 11:26:48,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +40: [2023-04-29 11:26:48,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +25: [2023-04-29 11:26:48,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +40: [2023-04-29 11:26:48,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +40: [2023-04-29 11:26:48,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +40: [2023-04-29 11:26:48,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +40: [2023-04-29 11:26:48,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +48: [2023-04-29 11:26:48,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +48: [2023-04-29 11:26:48,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +40: [2023-04-29 11:26:48,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 9: [2023-04-29 11:26:48,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +49: [2023-04-29 11:26:48,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +26: [2023-04-29 11:26:48,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +49: [2023-04-29 11:26:48,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +49: [2023-04-29 11:26:48,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +26: [2023-04-29 11:26:48,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +12: [2023-04-29 11:26:48,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +12: [2023-04-29 11:26:48,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +12: [2023-04-29 11:26:48,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +12: [2023-04-29 11:26:48,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +31: [2023-04-29 11:26:48,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +26: [2023-04-29 11:26:48,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +31: [2023-04-29 11:26:48,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +26: [2023-04-29 11:26:48,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +31: [2023-04-29 11:26:48,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +31: [2023-04-29 11:26:48,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 4: [2023-04-29 11:26:48,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 4: [2023-04-29 11:26:48,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +18: [2023-04-29 11:26:48,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +18: [2023-04-29 11:26:48,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +18: [2023-04-29 11:26:48,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +18: [2023-04-29 11:26:48,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 4: [2023-04-29 11:26:48,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 4: [2023-04-29 11:26:48,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +49: [2023-04-29 11:26:48,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. + 9: [2023-04-29 11:26:48,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +34: [2023-04-29 11:26:48,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +49: [2023-04-29 11:26:48,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +12: [2023-04-29 11:26:48,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +34: [2023-04-29 11:26:48,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +59: [2023-04-29 11:26:48,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +12: [2023-04-29 11:26:48,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +12: [2023-04-29 11:26:48,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +12: [2023-04-29 11:26:48,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +18: [2023-04-29 11:26:48,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +25: [2023-04-29 11:26:48,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +18: [2023-04-29 11:26:48,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +36: [2023-04-29 11:26:48,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +58: [2023-04-29 11:26:48,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +19: [2023-04-29 11:26:48,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +19: [2023-04-29 11:26:48,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +19: [2023-04-29 11:26:48,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +18: [2023-04-29 11:26:48,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +18: [2023-04-29 11:26:48,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +53: [2023-04-29 11:26:48,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +58: [2023-04-29 11:26:48,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +58: [2023-04-29 11:26:48,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +58: [2023-04-29 11:26:48,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +19: [2023-04-29 11:26:48,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 3: [2023-04-29 11:26:48,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +49: [2023-04-29 11:26:48,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +49: [2023-04-29 11:26:48,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +49: [2023-04-29 11:26:48,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 9: [2023-04-29 11:26:48,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +25: [2023-04-29 11:26:48,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +34: [2023-04-29 11:26:48,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +25: [2023-04-29 11:26:48,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 1: [2023-04-29 11:26:48,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 1: [2023-04-29 11:26:48,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 1: [2023-04-29 11:26:48,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 1: [2023-04-29 11:26:48,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +48: [2023-04-29 11:26:48,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +25: [2023-04-29 11:26:48,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +53: [2023-04-29 11:26:48,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +53: [2023-04-29 11:26:48,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +59: [2023-04-29 11:26:48,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +14: [2023-04-29 11:26:48,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +27: [2023-04-29 11:26:48,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +34: [2023-04-29 11:26:48,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +27: [2023-04-29 11:26:48,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +27: [2023-04-29 11:26:48,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +27: [2023-04-29 11:26:48,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +49: [2023-04-29 11:26:48,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +49: [2023-04-29 11:26:48,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 3: [2023-04-29 11:26:48,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 3: [2023-04-29 11:26:48,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +48: [2023-04-29 11:26:48,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +49: [2023-04-29 11:26:48,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +36: [2023-04-29 11:26:48,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +36: [2023-04-29 11:26:48,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +36: [2023-04-29 11:26:48,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +59: [2023-04-29 11:26:48,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +59: [2023-04-29 11:26:48,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +14: [2023-04-29 11:26:48,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +48: [2023-04-29 11:26:48,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +48: [2023-04-29 11:26:48,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +14: [2023-04-29 11:26:48,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +27: [2023-04-29 11:26:48,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +27: [2023-04-29 11:26:48,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +27: [2023-04-29 11:26:48,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +27: [2023-04-29 11:26:48,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +49: [2023-04-29 11:26:48,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +36: [2023-04-29 11:26:48,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +53: [2023-04-29 11:26:48,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +14: [2023-04-29 11:26:48,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +49: [2023-04-29 11:26:48,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +21: [2023-04-29 11:26:48,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +34: [2023-04-29 11:26:48,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +59: [2023-04-29 11:26:49,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 3: [2023-04-29 11:26:49,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +53: [2023-04-29 11:26:49,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +20: [2023-04-29 11:26:49,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +20: [2023-04-29 11:26:49,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +20: [2023-04-29 11:26:49,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +20: [2023-04-29 11:26:49,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 3: [2023-04-29 11:26:49,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +14: [2023-04-29 11:26:49,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +34: [2023-04-29 11:26:49,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +14: [2023-04-29 11:26:49,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +20: [2023-04-29 11:26:49,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +20: [2023-04-29 11:26:49,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +20: [2023-04-29 11:26:49,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +21: [2023-04-29 11:26:49,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 11:26:49,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 11:26:49,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +20: [2023-04-29 11:26:49,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +14: [2023-04-29 11:26:49,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +14: [2023-04-29 11:26:49,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... + 1: [2023-04-29 11:26:49,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +53: [2023-04-29 11:26:49,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +49: [2023-04-29 11:26:49,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +49: [2023-04-29 11:26:49,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +53: [2023-04-29 11:26:49,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +63: [2023-04-29 11:26:49,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +63: [2023-04-29 11:26:49,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +63: [2023-04-29 11:26:49,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +63: [2023-04-29 11:26:49,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +34: [2023-04-29 11:26:49,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +49: [2023-04-29 11:26:49,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +36: [2023-04-29 11:26:49,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +28: [2023-04-29 11:26:49,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +28: [2023-04-29 11:26:49,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +28: [2023-04-29 11:26:49,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +28: [2023-04-29 11:26:49,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 3: [2023-04-29 11:26:49,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +39: [2023-04-29 11:26:49,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 11:26:49,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 11:26:49,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 11:26:49,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +26: [2023-04-29 11:26:49,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +59: [2023-04-29 11:26:49,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +36: [2023-04-29 11:26:49,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +36: [2023-04-29 11:26:49,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +56: [2023-04-29 11:26:49,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +56: [2023-04-29 11:26:49,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +28: [2023-04-29 11:26:49,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +63: [2023-04-29 11:26:49,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +34: [2023-04-29 11:26:49,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +28: [2023-04-29 11:26:49,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 3: [2023-04-29 11:26:49,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +63: [2023-04-29 11:26:49,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 0: [2023-04-29 11:26:49,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 0: [2023-04-29 11:26:49,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +63: [2023-04-29 11:26:49,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +59: [2023-04-29 11:26:49,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +59: [2023-04-29 11:26:49,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +28: [2023-04-29 11:26:49,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +28: [2023-04-29 11:26:49,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +21: [2023-04-29 11:26:49,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +39: [2023-04-29 11:26:49,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +39: [2023-04-29 11:26:49,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +39: [2023-04-29 11:26:49,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +53: [2023-04-29 11:26:49,026] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +56: [2023-04-29 11:26:49,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +56: [2023-04-29 11:26:49,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +55: [2023-04-29 11:26:49,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +55: [2023-04-29 11:26:49,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +26: [2023-04-29 11:26:49,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +26: [2023-04-29 11:26:49,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +26: [2023-04-29 11:26:49,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +40: [2023-04-29 11:26:49,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 11:26:49,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +31: [2023-04-29 11:26:49,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +18: [2023-04-29 11:26:49,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +55: [2023-04-29 11:26:49,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +55: [2023-04-29 11:26:49,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +18: [2023-04-29 11:26:49,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +40: [2023-04-29 11:26:49,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 4: [2023-04-29 11:26:49,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +12: [2023-04-29 11:26:49,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +39: [2023-04-29 11:26:49,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +10: [2023-04-29 11:26:49,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +10: [2023-04-29 11:26:49,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +39: [2023-04-29 11:26:49,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 4: [2023-04-29 11:26:49,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 4: [2023-04-29 11:26:49,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +19: [2023-04-29 11:26:49,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 4: [2023-04-29 11:26:49,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +10: [2023-04-29 11:26:49,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +31: [2023-04-29 11:26:49,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +31: [2023-04-29 11:26:49,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +31: [2023-04-29 11:26:49,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 11:26:49,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +18: [2023-04-29 11:26:49,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +18: [2023-04-29 11:26:49,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +12: [2023-04-29 11:26:49,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 11:26:49,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +21: [2023-04-29 11:26:49,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +12: [2023-04-29 11:26:49,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +12: [2023-04-29 11:26:49,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 11:26:49,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +19: [2023-04-29 11:26:49,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +19: [2023-04-29 11:26:49,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +39: [2023-04-29 11:26:49,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... + 4: [2023-04-29 11:26:49,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... + 4: [2023-04-29 11:26:49,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... + 4: [2023-04-29 11:26:49,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +19: [2023-04-29 11:26:49,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +40: [2023-04-29 11:26:49,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +19: [2023-04-29 11:26:49,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +19: [2023-04-29 11:26:49,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +10: [2023-04-29 11:26:49,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 11:26:49,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 11:26:49,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 11:26:49,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 2: [2023-04-29 11:26:49,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 2: [2023-04-29 11:26:49,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 2: [2023-04-29 11:26:49,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 2: [2023-04-29 11:26:49,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +19: [2023-04-29 11:26:49,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +26: [2023-04-29 11:26:49,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +49: [2023-04-29 11:26:49,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +19: [2023-04-29 11:26:49,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +59: [2023-04-29 11:26:49,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +59: [2023-04-29 11:26:49,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. + 0: [2023-04-29 11:26:49,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +10: [2023-04-29 11:26:49,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +59: [2023-04-29 11:26:49,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +59: [2023-04-29 11:26:49,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +10: [2023-04-29 11:26:49,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +15: [2023-04-29 11:26:49,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +15: [2023-04-29 11:26:49,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +15: [2023-04-29 11:26:49,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +42: [2023-04-29 11:26:49,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +42: [2023-04-29 11:26:49,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +27: [2023-04-29 11:26:49,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +15: [2023-04-29 11:26:49,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +42: [2023-04-29 11:26:49,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +42: [2023-04-29 11:26:49,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_38-model_01-model_states.pt. +49: [2023-04-29 11:26:49,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... + 2: [2023-04-29 11:26:49,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +55: [2023-04-29 11:26:49,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +31: [2023-04-29 11:26:49,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +18: [2023-04-29 11:26:49,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +26: [2023-04-29 11:26:49,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +56: [2023-04-29 11:26:49,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +56: [2023-04-29 11:26:49,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +10: [2023-04-29 11:26:49,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +49: [2023-04-29 11:26:49,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 11:26:49,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +39: [2023-04-29 11:26:49,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +39: [2023-04-29 11:26:49,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +39: [2023-04-29 11:26:49,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +26: [2023-04-29 11:26:49,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +26: [2023-04-29 11:26:49,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +56: [2023-04-29 11:26:49,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +10: [2023-04-29 11:26:49,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +27: [2023-04-29 11:26:49,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +27: [2023-04-29 11:26:49,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +27: [2023-04-29 11:26:49,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 11:26:49,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +56: [2023-04-29 11:26:49,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +56: [2023-04-29 11:26:49,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +56: [2023-04-29 11:26:49,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +56: [2023-04-29 11:26:49,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +49: [2023-04-29 11:26:49,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +18: [2023-04-29 11:26:49,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +46: [2023-04-29 11:26:49,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 11:26:49,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 11:26:49,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 11:26:49,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 11:26:49,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 11:26:49,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 11:26:49,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 11:26:49,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +12: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +57: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +57: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +57: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +57: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +49: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +57: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +57: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +61: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +61: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +57: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +61: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +61: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +61: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +61: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +61: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +57: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +61: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +55: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +10: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +31: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +55: [2023-04-29 11:26:49,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +55: [2023-04-29 11:26:49,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +37: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +37: [2023-04-29 11:26:49,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +37: [2023-04-29 11:26:49,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +37: [2023-04-29 11:26:49,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +37: [2023-04-29 11:26:49,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +31: [2023-04-29 11:26:49,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +37: [2023-04-29 11:26:49,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +37: [2023-04-29 11:26:49,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +40: [2023-04-29 11:26:49,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +37: [2023-04-29 11:26:49,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +10: [2023-04-29 11:26:49,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +31: [2023-04-29 11:26:49,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +12: [2023-04-29 11:26:49,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +39: [2023-04-29 11:26:49,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +39: [2023-04-29 11:26:49,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +12: [2023-04-29 11:26:49,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +56: [2023-04-29 11:26:49,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +39: [2023-04-29 11:26:49,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +10: [2023-04-29 11:26:49,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +40: [2023-04-29 11:26:49,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +46: [2023-04-29 11:26:49,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +17: [2023-04-29 11:26:49,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +17: [2023-04-29 11:26:49,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +17: [2023-04-29 11:26:49,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +56: [2023-04-29 11:26:49,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +17: [2023-04-29 11:26:49,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +49: [2023-04-29 11:26:49,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +56: [2023-04-29 11:26:49,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +46: [2023-04-29 11:26:49,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +18: [2023-04-29 11:26:49,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +46: [2023-04-29 11:26:49,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +56: [2023-04-29 11:26:49,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +46: [2023-04-29 11:26:49,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +18: [2023-04-29 11:26:49,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +12: [2023-04-29 11:26:49,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +40: [2023-04-29 11:26:49,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +37: [2023-04-29 11:26:49,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +61: [2023-04-29 11:26:49,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +56: [2023-04-29 11:26:49,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +46: [2023-04-29 11:26:49,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +61: [2023-04-29 11:26:49,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +61: [2023-04-29 11:26:49,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +46: [2023-04-29 11:26:49,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +20: [2023-04-29 11:26:49,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +57: [2023-04-29 11:26:49,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +61: [2023-04-29 11:26:49,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +61: [2023-04-29 11:26:49,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +20: [2023-04-29 11:26:49,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +57: [2023-04-29 11:26:49,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +57: [2023-04-29 11:26:49,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +57: [2023-04-29 11:26:49,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +57: [2023-04-29 11:26:49,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +46: [2023-04-29 11:26:49,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +37: [2023-04-29 11:26:49,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +61: [2023-04-29 11:26:49,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +46: [2023-04-29 11:26:49,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +37: [2023-04-29 11:26:49,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... + 1: [2023-04-29 11:26:49,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +61: [2023-04-29 11:26:49,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +17: [2023-04-29 11:26:49,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +32: [2023-04-29 11:26:49,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +32: [2023-04-29 11:26:49,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +61: [2023-04-29 11:26:49,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +57: [2023-04-29 11:26:49,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +17: [2023-04-29 11:26:49,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +57: [2023-04-29 11:26:49,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +57: [2023-04-29 11:26:49,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +49: [2023-04-29 11:26:49,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +17: [2023-04-29 11:26:49,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +32: [2023-04-29 11:26:49,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +20: [2023-04-29 11:26:49,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +20: [2023-04-29 11:26:49,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +32: [2023-04-29 11:26:49,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. + 8: [2023-04-29 11:26:49,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 8: [2023-04-29 11:26:49,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +37: [2023-04-29 11:26:49,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 8: [2023-04-29 11:26:49,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +17: [2023-04-29 11:26:49,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +37: [2023-04-29 11:26:49,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +37: [2023-04-29 11:26:49,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... + 1: [2023-04-29 11:26:49,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +37: [2023-04-29 11:26:49,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +37: [2023-04-29 11:26:49,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +59: [2023-04-29 11:26:49,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +59: [2023-04-29 11:26:49,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +49: [2023-04-29 11:26:49,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +27: [2023-04-29 11:26:49,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +59: [2023-04-29 11:26:49,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +42: [2023-04-29 11:26:49,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +28: [2023-04-29 11:26:49,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 8: [2023-04-29 11:26:49,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +15: [2023-04-29 11:26:49,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +42: [2023-04-29 11:26:49,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +59: [2023-04-29 11:26:49,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +28: [2023-04-29 11:26:49,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 11:26:49,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 11:26:49,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 1: [2023-04-29 11:26:49,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 1: [2023-04-29 11:26:49,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +15: [2023-04-29 11:26:49,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +15: [2023-04-29 11:26:49,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +15: [2023-04-29 11:26:49,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +63: [2023-04-29 11:26:49,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +42: [2023-04-29 11:26:49,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +28: [2023-04-29 11:26:49,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +28: [2023-04-29 11:26:49,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +42: [2023-04-29 11:26:49,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +14: [2023-04-29 11:26:49,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 11:26:49,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +27: [2023-04-29 11:26:49,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +27: [2023-04-29 11:26:49,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +14: [2023-04-29 11:26:49,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +27: [2023-04-29 11:26:49,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +14: [2023-04-29 11:26:49,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +44: [2023-04-29 11:26:49,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +44: [2023-04-29 11:26:49,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +44: [2023-04-29 11:26:49,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +44: [2023-04-29 11:26:49,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +44: [2023-04-29 11:26:49,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +44: [2023-04-29 11:26:49,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +44: [2023-04-29 11:26:49,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +44: [2023-04-29 11:26:49,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 1: [2023-04-29 11:26:49,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... + 1: [2023-04-29 11:26:49,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +22: [2023-04-29 11:26:49,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +22: [2023-04-29 11:26:49,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +13: [2023-04-29 11:26:49,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +22: [2023-04-29 11:26:49,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +13: [2023-04-29 11:26:49,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +13: [2023-04-29 11:26:49,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 11:26:49,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +13: [2023-04-29 11:26:49,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +22: [2023-04-29 11:26:49,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +20: [2023-04-29 11:26:49,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +20: [2023-04-29 11:26:49,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +14: [2023-04-29 11:26:49,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +63: [2023-04-29 11:26:49,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +63: [2023-04-29 11:26:49,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +63: [2023-04-29 11:26:49,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +44: [2023-04-29 11:26:49,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +44: [2023-04-29 11:26:49,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +44: [2023-04-29 11:26:49,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +13: [2023-04-29 11:26:49,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +13: [2023-04-29 11:26:49,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +22: [2023-04-29 11:26:49,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +13: [2023-04-29 11:26:49,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +13: [2023-04-29 11:26:49,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +44: [2023-04-29 11:26:49,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +44: [2023-04-29 11:26:49,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +32: [2023-04-29 11:26:49,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +44: [2023-04-29 11:26:49,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +22: [2023-04-29 11:26:49,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +44: [2023-04-29 11:26:49,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +44: [2023-04-29 11:26:49,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +22: [2023-04-29 11:26:49,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +22: [2023-04-29 11:26:49,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +32: [2023-04-29 11:26:49,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +32: [2023-04-29 11:26:49,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +20: [2023-04-29 11:26:49,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +20: [2023-04-29 11:26:49,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 5: [2023-04-29 11:26:49,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 5: [2023-04-29 11:26:49,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 5: [2023-04-29 11:26:49,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +28: [2023-04-29 11:26:49,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +18: [2023-04-29 11:26:49,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +18: [2023-04-29 11:26:49,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +18: [2023-04-29 11:26:49,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +18: [2023-04-29 11:26:49,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +32: [2023-04-29 11:26:49,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +63: [2023-04-29 11:26:49,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +45: [2023-04-29 11:26:49,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +45: [2023-04-29 11:26:49,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +45: [2023-04-29 11:26:49,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +45: [2023-04-29 11:26:49,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +28: [2023-04-29 11:26:49,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 2: [2023-04-29 11:26:49,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +46: [2023-04-29 11:26:49,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +10: [2023-04-29 11:26:49,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 2: [2023-04-29 11:26:49,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 2: [2023-04-29 11:26:49,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 11:26:49,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +23: [2023-04-29 11:26:49,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +23: [2023-04-29 11:26:49,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +23: [2023-04-29 11:26:49,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +23: [2023-04-29 11:26:49,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +28: [2023-04-29 11:26:49,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +28: [2023-04-29 11:26:49,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... + 3: [2023-04-29 11:26:49,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 3: [2023-04-29 11:26:49,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +17: [2023-04-29 11:26:49,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +17: [2023-04-29 11:26:49,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +17: [2023-04-29 11:26:49,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 3: [2023-04-29 11:26:49,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +17: [2023-04-29 11:26:49,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 3: [2023-04-29 11:26:49,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +37: [2023-04-29 11:26:49,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +10: [2023-04-29 11:26:49,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 11:26:49,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +63: [2023-04-29 11:26:49,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +39: [2023-04-29 11:26:49,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +59: [2023-04-29 11:26:49,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 11:26:49,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +61: [2023-04-29 11:26:49,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +56: [2023-04-29 11:26:49,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +10: [2023-04-29 11:26:49,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 6: [2023-04-29 11:26:49,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 6: [2023-04-29 11:26:49,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 6: [2023-04-29 11:26:49,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 0: [2023-04-29 11:26:49,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 0: [2023-04-29 11:26:49,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +53: [2023-04-29 11:26:49,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +53: [2023-04-29 11:26:49,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +53: [2023-04-29 11:26:49,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +53: [2023-04-29 11:26:49,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +46: [2023-04-29 11:26:49,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +59: [2023-04-29 11:26:49,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +63: [2023-04-29 11:26:49,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,131] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +37: [2023-04-29 11:26:49,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +56: [2023-04-29 11:26:49,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 11:26:49,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +10: [2023-04-29 11:26:49,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +61: [2023-04-29 11:26:49,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +61: [2023-04-29 11:26:49,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +57: [2023-04-29 11:26:49,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 0: [2023-04-29 11:26:49,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +17: [2023-04-29 11:26:49,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 0: [2023-04-29 11:26:49,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +56: [2023-04-29 11:26:49,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 11:26:49,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +56: [2023-04-29 11:26:49,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +45: [2023-04-29 11:26:49,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +37: [2023-04-29 11:26:49,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +57: [2023-04-29 11:26:49,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +57: [2023-04-29 11:26:49,139] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +17: [2023-04-29 11:26:49,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +15: [2023-04-29 11:26:49,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +46: [2023-04-29 11:26:49,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 11:26:49,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +39: [2023-04-29 11:26:49,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +18: [2023-04-29 11:26:49,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +57: [2023-04-29 11:26:49,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +45: [2023-04-29 11:26:49,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +56: [2023-04-29 11:26:49,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +10: [2023-04-29 11:26:49,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +59: [2023-04-29 11:26:49,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +10: [2023-04-29 11:26:49,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +45: [2023-04-29 11:26:49,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +45: [2023-04-29 11:26:49,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +61: [2023-04-29 11:26:49,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +46: [2023-04-29 11:26:49,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +15: [2023-04-29 11:26:49,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +56: [2023-04-29 11:26:49,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +56: [2023-04-29 11:26:49,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +17: [2023-04-29 11:26:49,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +17: [2023-04-29 11:26:49,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +18: [2023-04-29 11:26:49,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +18: [2023-04-29 11:26:49,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +56: [2023-04-29 11:26:49,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +56: [2023-04-29 11:26:49,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +17: [2023-04-29 11:26:49,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +59: [2023-04-29 11:26:49,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +59: [2023-04-29 11:26:49,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +23: [2023-04-29 11:26:49,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +23: [2023-04-29 11:26:49,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +23: [2023-04-29 11:26:49,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 3: [2023-04-29 11:26:49,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +17: [2023-04-29 11:26:49,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +17: [2023-04-29 11:26:49,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +56: [2023-04-29 11:26:49,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... + 3: [2023-04-29 11:26:49,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +59: [2023-04-29 11:26:49,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +37: [2023-04-29 11:26:49,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 8: [2023-04-29 11:26:49,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 8: [2023-04-29 11:26:49,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 8: [2023-04-29 11:26:49,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 2: [2023-04-29 11:26:49,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +56: [2023-04-29 11:26:49,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +17: [2023-04-29 11:26:49,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +18: [2023-04-29 11:26:49,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +11: [2023-04-29 11:26:49,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +11: [2023-04-29 11:26:49,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +23: [2023-04-29 11:26:49,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +11: [2023-04-29 11:26:49,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 11:26:49,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +11: [2023-04-29 11:26:49,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +37: [2023-04-29 11:26:49,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +10: [2023-04-29 11:26:49,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 11:26:49,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +10: [2023-04-29 11:26:49,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +39: [2023-04-29 11:26:49,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 3: [2023-04-29 11:26:49,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +56: [2023-04-29 11:26:49,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +59: [2023-04-29 11:26:49,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +59: [2023-04-29 11:26:49,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... + 3: [2023-04-29 11:26:49,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +15: [2023-04-29 11:26:49,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +10: [2023-04-29 11:26:49,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +13: [2023-04-29 11:26:49,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +11: [2023-04-29 11:26:49,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +15: [2023-04-29 11:26:49,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +61: [2023-04-29 11:26:49,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +15: [2023-04-29 11:26:49,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +53: [2023-04-29 11:26:49,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +56: [2023-04-29 11:26:49,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +22: [2023-04-29 11:26:49,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +44: [2023-04-29 11:26:49,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +11: [2023-04-29 11:26:49,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 7: [2023-04-29 11:26:49,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +43: [2023-04-29 11:26:49,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 11:26:49,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 11:26:49,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 11:26:49,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 11:26:49,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +53: [2023-04-29 11:26:49,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 11:26:49,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 11:26:49,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 11:26:49,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +11: [2023-04-29 11:26:49,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 6: [2023-04-29 11:26:49,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 6: [2023-04-29 11:26:49,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 6: [2023-04-29 11:26:49,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +11: [2023-04-29 11:26:49,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +53: [2023-04-29 11:26:49,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +56: [2023-04-29 11:26:49,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +12: [2023-04-29 11:26:49,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +46: [2023-04-29 11:26:49,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +12: [2023-04-29 11:26:49,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +12: [2023-04-29 11:26:49,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +12: [2023-04-29 11:26:49,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 6: [2023-04-29 11:26:49,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +44: [2023-04-29 11:26:49,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +61: [2023-04-29 11:26:49,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +15: [2023-04-29 11:26:49,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +53: [2023-04-29 11:26:49,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +13: [2023-04-29 11:26:49,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +61: [2023-04-29 11:26:49,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 7: [2023-04-29 11:26:49,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +43: [2023-04-29 11:26:49,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +37: [2023-04-29 11:26:49,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +10: [2023-04-29 11:26:49,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +43: [2023-04-29 11:26:49,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +44: [2023-04-29 11:26:49,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +44: [2023-04-29 11:26:49,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +43: [2023-04-29 11:26:49,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 11:26:49,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +10: [2023-04-29 11:26:49,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +15: [2023-04-29 11:26:49,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +39: [2023-04-29 11:26:49,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +15: [2023-04-29 11:26:49,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +43: [2023-04-29 11:26:49,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 11:26:49,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +43: [2023-04-29 11:26:49,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 11:26:49,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... + 7: [2023-04-29 11:26:49,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +14: [2023-04-29 11:26:49,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +57: [2023-04-29 11:26:49,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +57: [2023-04-29 11:26:49,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +52: [2023-04-29 11:26:49,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +52: [2023-04-29 11:26:49,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +52: [2023-04-29 11:26:49,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +52: [2023-04-29 11:26:49,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +52: [2023-04-29 11:26:49,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +52: [2023-04-29 11:26:49,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +52: [2023-04-29 11:26:49,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +10: [2023-04-29 11:26:49,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +52: [2023-04-29 11:26:49,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +37: [2023-04-29 11:26:49,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +17: [2023-04-29 11:26:49,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +57: [2023-04-29 11:26:49,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +17: [2023-04-29 11:26:49,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +39: [2023-04-29 11:26:49,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +22: [2023-04-29 11:26:49,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +22: [2023-04-29 11:26:49,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +22: [2023-04-29 11:26:49,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 11:26:49,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 11:26:49,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +52: [2023-04-29 11:26:49,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +46: [2023-04-29 11:26:49,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +52: [2023-04-29 11:26:49,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +57: [2023-04-29 11:26:49,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +39: [2023-04-29 11:26:49,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +52: [2023-04-29 11:26:49,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +52: [2023-04-29 11:26:49,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +52: [2023-04-29 11:26:49,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +10: [2023-04-29 11:26:49,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +46: [2023-04-29 11:26:49,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +14: [2023-04-29 11:26:49,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +52: [2023-04-29 11:26:49,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +13: [2023-04-29 11:26:49,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +13: [2023-04-29 11:26:49,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +52: [2023-04-29 11:26:49,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +52: [2023-04-29 11:26:49,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +56: [2023-04-29 11:26:49,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +61: [2023-04-29 11:26:49,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +56: [2023-04-29 11:26:49,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +17: [2023-04-29 11:26:49,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 5: [2023-04-29 11:26:49,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +37: [2023-04-29 11:26:49,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +22: [2023-04-29 11:26:49,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +11: [2023-04-29 11:26:49,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +17: [2023-04-29 11:26:49,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +44: [2023-04-29 11:26:49,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 11:26:49,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +11: [2023-04-29 11:26:49,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +10: [2023-04-29 11:26:49,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +12: [2023-04-29 11:26:49,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +13: [2023-04-29 11:26:49,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +12: [2023-04-29 11:26:49,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +12: [2023-04-29 11:26:49,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +12: [2023-04-29 11:26:49,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +44: [2023-04-29 11:26:49,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +14: [2023-04-29 11:26:49,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +63: [2023-04-29 11:26:49,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +63: [2023-04-29 11:26:49,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +63: [2023-04-29 11:26:49,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +63: [2023-04-29 11:26:49,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +11: [2023-04-29 11:26:49,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +11: [2023-04-29 11:26:49,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +44: [2023-04-29 11:26:49,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +44: [2023-04-29 11:26:49,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +22: [2023-04-29 11:26:49,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +14: [2023-04-29 11:26:49,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 11:26:49,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +14: [2023-04-29 11:26:49,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +22: [2023-04-29 11:26:49,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +22: [2023-04-29 11:26:49,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 11:26:49,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +11: [2023-04-29 11:26:49,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +18: [2023-04-29 11:26:49,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +14: [2023-04-29 11:26:49,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +23: [2023-04-29 11:26:49,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +18: [2023-04-29 11:26:49,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... + 3: [2023-04-29 11:26:49,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +23: [2023-04-29 11:26:49,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +34: [2023-04-29 11:26:49,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +34: [2023-04-29 11:26:49,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +19: [2023-04-29 11:26:49,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +19: [2023-04-29 11:26:49,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +19: [2023-04-29 11:26:49,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +18: [2023-04-29 11:26:49,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +19: [2023-04-29 11:26:49,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +34: [2023-04-29 11:26:49,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. + 5: [2023-04-29 11:26:49,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +34: [2023-04-29 11:26:49,216] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +23: [2023-04-29 11:26:49,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +23: [2023-04-29 11:26:49,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 3: [2023-04-29 11:26:49,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +17: [2023-04-29 11:26:49,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 3: [2023-04-29 11:26:49,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +18: [2023-04-29 11:26:49,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 5: [2023-04-29 11:26:49,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 7: [2023-04-29 11:26:49,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +19: [2023-04-29 11:26:49,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +19: [2023-04-29 11:26:49,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +19: [2023-04-29 11:26:49,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +19: [2023-04-29 11:26:49,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +18: [2023-04-29 11:26:49,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +17: [2023-04-29 11:26:49,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +23: [2023-04-29 11:26:49,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +23: [2023-04-29 11:26:49,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +18: [2023-04-29 11:26:49,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 3: [2023-04-29 11:26:49,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +11: [2023-04-29 11:26:49,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +52: [2023-04-29 11:26:49,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +63: [2023-04-29 11:26:49,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +18: [2023-04-29 11:26:49,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +43: [2023-04-29 11:26:49,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +38: [2023-04-29 11:26:49,224] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +38: [2023-04-29 11:26:49,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +17: [2023-04-29 11:26:49,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +17: [2023-04-29 11:26:49,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +38: [2023-04-29 11:26:49,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +38: [2023-04-29 11:26:49,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +63: [2023-04-29 11:26:49,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +11: [2023-04-29 11:26:49,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +23: [2023-04-29 11:26:49,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 3: [2023-04-29 11:26:49,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +36: [2023-04-29 11:26:49,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +36: [2023-04-29 11:26:49,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. + 3: [2023-04-29 11:26:49,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +11: [2023-04-29 11:26:49,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +36: [2023-04-29 11:26:49,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +43: [2023-04-29 11:26:49,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 11:26:49,228] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +18: [2023-04-29 11:26:49,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +63: [2023-04-29 11:26:49,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +63: [2023-04-29 11:26:49,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +17: [2023-04-29 11:26:49,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +17: [2023-04-29 11:26:49,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +17: [2023-04-29 11:26:49,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +43: [2023-04-29 11:26:49,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 11:26:49,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +23: [2023-04-29 11:26:49,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... + 7: [2023-04-29 11:26:49,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 3: [2023-04-29 11:26:49,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +11: [2023-04-29 11:26:49,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 3: [2023-04-29 11:26:49,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... + 6: [2023-04-29 11:26:49,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... + 6: [2023-04-29 11:26:49,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... + 6: [2023-04-29 11:26:49,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +17: [2023-04-29 11:26:49,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +52: [2023-04-29 11:26:49,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +52: [2023-04-29 11:26:49,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +52: [2023-04-29 11:26:49,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 8: [2023-04-29 11:26:49,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 8: [2023-04-29 11:26:49,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 8: [2023-04-29 11:26:49,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +34: [2023-04-29 11:26:49,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +34: [2023-04-29 11:26:49,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 6: [2023-04-29 11:26:49,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... + 7: [2023-04-29 11:26:49,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +40: [2023-04-29 11:26:49,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +40: [2023-04-29 11:26:49,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +40: [2023-04-29 11:26:49,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +40: [2023-04-29 11:26:49,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +34: [2023-04-29 11:26:49,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +34: [2023-04-29 11:26:49,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 11:26:49,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +12: [2023-04-29 11:26:49,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +11: [2023-04-29 11:26:49,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +38: [2023-04-29 11:26:49,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +38: [2023-04-29 11:26:49,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +38: [2023-04-29 11:26:49,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +38: [2023-04-29 11:26:49,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +52: [2023-04-29 11:26:49,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +36: [2023-04-29 11:26:49,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +36: [2023-04-29 11:26:49,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +36: [2023-04-29 11:26:49,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +12: [2023-04-29 11:26:49,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +43: [2023-04-29 11:26:49,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +12: [2023-04-29 11:26:49,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +43: [2023-04-29 11:26:49,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 11:26:49,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 11:26:49,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +12: [2023-04-29 11:26:49,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +12: [2023-04-29 11:26:49,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 7: [2023-04-29 11:26:49,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +12: [2023-04-29 11:26:49,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +52: [2023-04-29 11:26:49,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +52: [2023-04-29 11:26:49,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +11: [2023-04-29 11:26:49,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +11: [2023-04-29 11:26:49,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +12: [2023-04-29 11:26:49,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +11: [2023-04-29 11:26:49,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +12: [2023-04-29 11:26:49,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +52: [2023-04-29 11:26:49,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 7: [2023-04-29 11:26:49,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +27: [2023-04-29 11:26:49,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +27: [2023-04-29 11:26:49,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +11: [2023-04-29 11:26:49,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +27: [2023-04-29 11:26:49,271] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +27: [2023-04-29 11:26:49,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +11: [2023-04-29 11:26:49,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... + 8: [2023-04-29 11:26:49,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +40: [2023-04-29 11:26:49,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +19: [2023-04-29 11:26:49,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +40: [2023-04-29 11:26:49,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +40: [2023-04-29 11:26:49,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +40: [2023-04-29 11:26:49,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 5: [2023-04-29 11:26:49,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 5: [2023-04-29 11:26:49,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 5: [2023-04-29 11:26:49,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +19: [2023-04-29 11:26:49,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +30: [2023-04-29 11:26:49,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +30: [2023-04-29 11:26:49,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +30: [2023-04-29 11:26:49,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +30: [2023-04-29 11:26:49,290] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +63: [2023-04-29 11:26:49,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +19: [2023-04-29 11:26:49,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +19: [2023-04-29 11:26:49,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +63: [2023-04-29 11:26:49,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +63: [2023-04-29 11:26:49,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +39: [2023-04-29 11:26:49,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +39: [2023-04-29 11:26:49,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +39: [2023-04-29 11:26:49,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +39: [2023-04-29 11:26:49,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +63: [2023-04-29 11:26:49,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +19: [2023-04-29 11:26:49,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +27: [2023-04-29 11:26:49,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +27: [2023-04-29 11:26:49,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +27: [2023-04-29 11:26:49,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +41: [2023-04-29 11:26:49,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +41: [2023-04-29 11:26:49,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +41: [2023-04-29 11:26:49,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +41: [2023-04-29 11:26:49,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +41: [2023-04-29 11:26:49,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +41: [2023-04-29 11:26:49,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +41: [2023-04-29 11:26:49,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +41: [2023-04-29 11:26:49,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 11:26:49,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +13: [2023-04-29 11:26:49,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +27: [2023-04-29 11:26:49,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +13: [2023-04-29 11:26:49,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +13: [2023-04-29 11:26:49,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +28: [2023-04-29 11:26:49,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +28: [2023-04-29 11:26:49,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +28: [2023-04-29 11:26:49,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +13: [2023-04-29 11:26:49,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +28: [2023-04-29 11:26:49,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +11: [2023-04-29 11:26:49,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +63: [2023-04-29 11:26:49,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +11: [2023-04-29 11:26:49,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +11: [2023-04-29 11:26:49,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 9: [2023-04-29 11:26:49,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 9: [2023-04-29 11:26:49,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 9: [2023-04-29 11:26:49,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 9: [2023-04-29 11:26:49,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +41: [2023-04-29 11:26:49,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +41: [2023-04-29 11:26:49,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +41: [2023-04-29 11:26:49,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +49: [2023-04-29 11:26:49,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +49: [2023-04-29 11:26:49,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +49: [2023-04-29 11:26:49,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +49: [2023-04-29 11:26:49,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +41: [2023-04-29 11:26:49,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +41: [2023-04-29 11:26:49,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +41: [2023-04-29 11:26:49,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +63: [2023-04-29 11:26:49,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +41: [2023-04-29 11:26:49,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +63: [2023-04-29 11:26:49,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +41: [2023-04-29 11:26:49,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +19: [2023-04-29 11:26:49,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +54: [2023-04-29 11:26:49,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +54: [2023-04-29 11:26:49,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +54: [2023-04-29 11:26:49,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +54: [2023-04-29 11:26:49,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +54: [2023-04-29 11:26:49,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +54: [2023-04-29 11:26:49,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +54: [2023-04-29 11:26:49,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 5: [2023-04-29 11:26:49,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +54: [2023-04-29 11:26:49,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +62: [2023-04-29 11:26:49,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +62: [2023-04-29 11:26:49,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +62: [2023-04-29 11:26:49,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +62: [2023-04-29 11:26:49,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +62: [2023-04-29 11:26:49,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +62: [2023-04-29 11:26:49,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +62: [2023-04-29 11:26:49,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +62: [2023-04-29 11:26:49,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +31: [2023-04-29 11:26:49,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +31: [2023-04-29 11:26:49,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +31: [2023-04-29 11:26:49,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +31: [2023-04-29 11:26:49,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +30: [2023-04-29 11:26:49,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +30: [2023-04-29 11:26:49,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +54: [2023-04-29 11:26:49,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +54: [2023-04-29 11:26:49,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +30: [2023-04-29 11:26:49,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +54: [2023-04-29 11:26:49,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +54: [2023-04-29 11:26:49,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +54: [2023-04-29 11:26:49,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +62: [2023-04-29 11:26:49,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +62: [2023-04-29 11:26:49,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +62: [2023-04-29 11:26:49,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +62: [2023-04-29 11:26:49,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +62: [2023-04-29 11:26:49,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +30: [2023-04-29 11:26:49,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +62: [2023-04-29 11:26:49,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +54: [2023-04-29 11:26:49,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +54: [2023-04-29 11:26:49,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +62: [2023-04-29 11:26:49,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +54: [2023-04-29 11:26:49,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +62: [2023-04-29 11:26:49,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +19: [2023-04-29 11:26:49,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +19: [2023-04-29 11:26:49,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +11: [2023-04-29 11:26:49,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 11:26:49,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +25: [2023-04-29 11:26:49,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +39: [2023-04-29 11:26:49,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +25: [2023-04-29 11:26:49,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +25: [2023-04-29 11:26:49,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +25: [2023-04-29 11:26:49,329] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +39: [2023-04-29 11:26:49,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +39: [2023-04-29 11:26:49,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +24: [2023-04-29 11:26:49,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +24: [2023-04-29 11:26:49,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 9: [2023-04-29 11:26:49,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +24: [2023-04-29 11:26:49,331] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 8: [2023-04-29 11:26:49,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +24: [2023-04-29 11:26:49,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +28: [2023-04-29 11:26:49,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +11: [2023-04-29 11:26:49,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +60: [2023-04-29 11:26:49,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +60: [2023-04-29 11:26:49,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +60: [2023-04-29 11:26:49,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +11: [2023-04-29 11:26:49,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +60: [2023-04-29 11:26:49,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +60: [2023-04-29 11:26:49,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +60: [2023-04-29 11:26:49,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +60: [2023-04-29 11:26:49,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +49: [2023-04-29 11:26:49,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +60: [2023-04-29 11:26:49,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +13: [2023-04-29 11:26:49,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +13: [2023-04-29 11:26:49,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +39: [2023-04-29 11:26:49,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 9: [2023-04-29 11:26:49,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +13: [2023-04-29 11:26:49,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +13: [2023-04-29 11:26:49,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +49: [2023-04-29 11:26:49,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +49: [2023-04-29 11:26:49,336] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +28: [2023-04-29 11:26:49,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 9: [2023-04-29 11:26:49,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +28: [2023-04-29 11:26:49,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +28: [2023-04-29 11:26:49,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 9: [2023-04-29 11:26:49,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +49: [2023-04-29 11:26:49,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +60: [2023-04-29 11:26:49,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +60: [2023-04-29 11:26:49,338] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +60: [2023-04-29 11:26:49,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +60: [2023-04-29 11:26:49,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +61: [2023-04-29 11:26:49,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +61: [2023-04-29 11:26:49,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +61: [2023-04-29 11:26:49,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +61: [2023-04-29 11:26:49,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +11: [2023-04-29 11:26:49,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +11: [2023-04-29 11:26:49,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +60: [2023-04-29 11:26:49,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +60: [2023-04-29 11:26:49,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +60: [2023-04-29 11:26:49,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +31: [2023-04-29 11:26:49,342] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +60: [2023-04-29 11:26:49,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +31: [2023-04-29 11:26:49,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +31: [2023-04-29 11:26:49,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 11:26:49,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 8: [2023-04-29 11:26:49,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +11: [2023-04-29 11:26:49,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +31: [2023-04-29 11:26:49,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +29: [2023-04-29 11:26:49,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +29: [2023-04-29 11:26:49,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +29: [2023-04-29 11:26:49,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +29: [2023-04-29 11:26:49,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 8: [2023-04-29 11:26:49,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +25: [2023-04-29 11:26:49,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... + 8: [2023-04-29 11:26:49,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +24: [2023-04-29 11:26:49,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +25: [2023-04-29 11:26:49,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +25: [2023-04-29 11:26:49,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +33: [2023-04-29 11:26:49,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +33: [2023-04-29 11:26:49,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +33: [2023-04-29 11:26:49,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +33: [2023-04-29 11:26:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +33: [2023-04-29 11:26:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +33: [2023-04-29 11:26:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +33: [2023-04-29 11:26:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +51: [2023-04-29 11:26:49,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +51: [2023-04-29 11:26:49,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +51: [2023-04-29 11:26:49,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +51: [2023-04-29 11:26:49,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +51: [2023-04-29 11:26:49,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +51: [2023-04-29 11:26:49,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +51: [2023-04-29 11:26:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +33: [2023-04-29 11:26:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +51: [2023-04-29 11:26:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +47: [2023-04-29 11:26:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +47: [2023-04-29 11:26:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +47: [2023-04-29 11:26:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +47: [2023-04-29 11:26:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +47: [2023-04-29 11:26:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +47: [2023-04-29 11:26:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +47: [2023-04-29 11:26:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +47: [2023-04-29 11:26:49,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +25: [2023-04-29 11:26:49,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +27: [2023-04-29 11:26:49,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +24: [2023-04-29 11:26:49,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +24: [2023-04-29 11:26:49,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +33: [2023-04-29 11:26:49,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +33: [2023-04-29 11:26:49,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +33: [2023-04-29 11:26:49,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +51: [2023-04-29 11:26:49,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +51: [2023-04-29 11:26:49,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +51: [2023-04-29 11:26:49,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +51: [2023-04-29 11:26:49,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +24: [2023-04-29 11:26:49,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +51: [2023-04-29 11:26:49,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +51: [2023-04-29 11:26:49,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +51: [2023-04-29 11:26:49,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +47: [2023-04-29 11:26:49,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +47: [2023-04-29 11:26:49,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +61: [2023-04-29 11:26:49,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +51: [2023-04-29 11:26:49,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +47: [2023-04-29 11:26:49,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +47: [2023-04-29 11:26:49,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +47: [2023-04-29 11:26:49,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +30: [2023-04-29 11:26:49,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +33: [2023-04-29 11:26:49,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 4: [2023-04-29 11:26:49,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 4: [2023-04-29 11:26:49,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +16: [2023-04-29 11:26:49,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +16: [2023-04-29 11:26:49,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +16: [2023-04-29 11:26:49,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 4: [2023-04-29 11:26:49,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +61: [2023-04-29 11:26:49,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +16: [2023-04-29 11:26:49,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +33: [2023-04-29 11:26:49,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +33: [2023-04-29 11:26:49,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +33: [2023-04-29 11:26:49,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +41: [2023-04-29 11:26:49,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +14: [2023-04-29 11:26:49,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +14: [2023-04-29 11:26:49,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +14: [2023-04-29 11:26:49,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +27: [2023-04-29 11:26:49,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +27: [2023-04-29 11:26:49,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +14: [2023-04-29 11:26:49,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +33: [2023-04-29 11:26:49,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +61: [2023-04-29 11:26:49,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +30: [2023-04-29 11:26:49,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +47: [2023-04-29 11:26:49,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +27: [2023-04-29 11:26:49,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +27: [2023-04-29 11:26:49,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +47: [2023-04-29 11:26:49,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +47: [2023-04-29 11:26:49,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +61: [2023-04-29 11:26:49,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +16: [2023-04-29 11:26:49,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +16: [2023-04-29 11:26:49,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +62: [2023-04-29 11:26:49,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +58: [2023-04-29 11:26:49,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +58: [2023-04-29 11:26:49,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +58: [2023-04-29 11:26:49,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +58: [2023-04-29 11:26:49,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +58: [2023-04-29 11:26:49,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +58: [2023-04-29 11:26:49,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +58: [2023-04-29 11:26:49,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +27: [2023-04-29 11:26:49,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +16: [2023-04-29 11:26:49,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +58: [2023-04-29 11:26:49,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +27: [2023-04-29 11:26:49,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... + 4: [2023-04-29 11:26:49,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +16: [2023-04-29 11:26:49,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +41: [2023-04-29 11:26:49,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +27: [2023-04-29 11:26:49,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +30: [2023-04-29 11:26:49,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 4: [2023-04-29 11:26:49,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +29: [2023-04-29 11:26:49,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +41: [2023-04-29 11:26:49,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +41: [2023-04-29 11:26:49,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +54: [2023-04-29 11:26:49,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +29: [2023-04-29 11:26:49,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +58: [2023-04-29 11:26:49,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +46: [2023-04-29 11:26:49,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +46: [2023-04-29 11:26:49,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +30: [2023-04-29 11:26:49,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +20: [2023-04-29 11:26:49,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +20: [2023-04-29 11:26:49,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +20: [2023-04-29 11:26:49,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +62: [2023-04-29 11:26:49,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +58: [2023-04-29 11:26:49,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +58: [2023-04-29 11:26:49,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +58: [2023-04-29 11:26:49,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +58: [2023-04-29 11:26:49,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +46: [2023-04-29 11:26:49,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +37: [2023-04-29 11:26:49,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +37: [2023-04-29 11:26:49,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +20: [2023-04-29 11:26:49,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +46: [2023-04-29 11:26:49,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +58: [2023-04-29 11:26:49,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +58: [2023-04-29 11:26:49,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +29: [2023-04-29 11:26:49,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +30: [2023-04-29 11:26:49,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +29: [2023-04-29 11:26:49,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +58: [2023-04-29 11:26:49,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +37: [2023-04-29 11:26:49,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +30: [2023-04-29 11:26:49,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +37: [2023-04-29 11:26:49,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +54: [2023-04-29 11:26:49,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +54: [2023-04-29 11:26:49,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 5: [2023-04-29 11:26:49,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 9: [2023-04-29 11:26:49,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 5: [2023-04-29 11:26:49,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +30: [2023-04-29 11:26:49,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +54: [2023-04-29 11:26:49,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 5: [2023-04-29 11:26:49,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +30: [2023-04-29 11:26:49,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +62: [2023-04-29 11:26:49,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 9: [2023-04-29 11:26:49,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +28: [2023-04-29 11:26:49,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 5: [2023-04-29 11:26:49,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +62: [2023-04-29 11:26:49,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +23: [2023-04-29 11:26:49,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +23: [2023-04-29 11:26:49,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +23: [2023-04-29 11:26:49,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +23: [2023-04-29 11:26:49,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +41: [2023-04-29 11:26:49,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +14: [2023-04-29 11:26:49,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 1: [2023-04-29 11:26:49,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 1: [2023-04-29 11:26:49,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 1: [2023-04-29 11:26:49,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +14: [2023-04-29 11:26:49,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +14: [2023-04-29 11:26:49,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +60: [2023-04-29 11:26:49,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +39: [2023-04-29 11:26:49,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +39: [2023-04-29 11:26:49,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 9: [2023-04-29 11:26:49,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +23: [2023-04-29 11:26:49,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +23: [2023-04-29 11:26:49,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +62: [2023-04-29 11:26:49,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +23: [2023-04-29 11:26:49,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +28: [2023-04-29 11:26:49,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +13: [2023-04-29 11:26:49,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +13: [2023-04-29 11:26:49,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +13: [2023-04-29 11:26:49,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 1: [2023-04-29 11:26:49,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +28: [2023-04-29 11:26:49,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +23: [2023-04-29 11:26:49,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +31: [2023-04-29 11:26:49,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 1: [2023-04-29 11:26:49,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +14: [2023-04-29 11:26:49,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 9: [2023-04-29 11:26:49,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +39: [2023-04-29 11:26:49,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +39: [2023-04-29 11:26:49,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... + 9: [2023-04-29 11:26:49,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 9: [2023-04-29 11:26:49,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +13: [2023-04-29 11:26:49,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +28: [2023-04-29 11:26:49,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +31: [2023-04-29 11:26:49,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +54: [2023-04-29 11:26:49,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +28: [2023-04-29 11:26:49,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +41: [2023-04-29 11:26:49,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +41: [2023-04-29 11:26:49,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +41: [2023-04-29 11:26:49,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +62: [2023-04-29 11:26:49,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +31: [2023-04-29 11:26:49,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +39: [2023-04-29 11:26:49,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +39: [2023-04-29 11:26:49,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +38: [2023-04-29 11:26:49,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +38: [2023-04-29 11:26:49,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +38: [2023-04-29 11:26:49,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +13: [2023-04-29 11:26:49,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +13: [2023-04-29 11:26:49,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +38: [2023-04-29 11:26:49,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +38: [2023-04-29 11:26:49,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +57: [2023-04-29 11:26:49,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +57: [2023-04-29 11:26:49,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +57: [2023-04-29 11:26:49,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +38: [2023-04-29 11:26:49,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +38: [2023-04-29 11:26:49,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +13: [2023-04-29 11:26:49,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +38: [2023-04-29 11:26:49,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +57: [2023-04-29 11:26:49,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +28: [2023-04-29 11:26:49,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +20: [2023-04-29 11:26:49,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +20: [2023-04-29 11:26:49,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +31: [2023-04-29 11:26:49,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +46: [2023-04-29 11:26:49,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +46: [2023-04-29 11:26:49,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 9: [2023-04-29 11:26:49,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... + 9: [2023-04-29 11:26:49,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +46: [2023-04-29 11:26:49,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +46: [2023-04-29 11:26:49,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +54: [2023-04-29 11:26:49,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +28: [2023-04-29 11:26:49,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +60: [2023-04-29 11:26:49,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +60: [2023-04-29 11:26:49,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +50: [2023-04-29 11:26:49,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +50: [2023-04-29 11:26:49,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +50: [2023-04-29 11:26:49,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +50: [2023-04-29 11:26:49,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +50: [2023-04-29 11:26:49,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +50: [2023-04-29 11:26:49,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +50: [2023-04-29 11:26:49,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +50: [2023-04-29 11:26:49,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +13: [2023-04-29 11:26:49,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +39: [2023-04-29 11:26:49,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +39: [2023-04-29 11:26:49,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +38: [2023-04-29 11:26:49,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +24: [2023-04-29 11:26:49,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +37: [2023-04-29 11:26:49,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +37: [2023-04-29 11:26:49,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +37: [2023-04-29 11:26:49,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +28: [2023-04-29 11:26:49,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +59: [2023-04-29 11:26:49,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +59: [2023-04-29 11:26:49,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +54: [2023-04-29 11:26:49,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +38: [2023-04-29 11:26:49,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +38: [2023-04-29 11:26:49,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +60: [2023-04-29 11:26:49,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +38: [2023-04-29 11:26:49,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +38: [2023-04-29 11:26:49,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +25: [2023-04-29 11:26:49,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +38: [2023-04-29 11:26:49,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +38: [2023-04-29 11:26:49,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +20: [2023-04-29 11:26:49,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +62: [2023-04-29 11:26:49,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +31: [2023-04-29 11:26:49,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +38: [2023-04-29 11:26:49,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +62: [2023-04-29 11:26:49,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +59: [2023-04-29 11:26:49,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +59: [2023-04-29 11:26:49,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +37: [2023-04-29 11:26:49,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +24: [2023-04-29 11:26:49,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +50: [2023-04-29 11:26:49,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +50: [2023-04-29 11:26:49,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +50: [2023-04-29 11:26:49,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +50: [2023-04-29 11:26:49,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +54: [2023-04-29 11:26:49,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +31: [2023-04-29 11:26:49,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +20: [2023-04-29 11:26:49,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 6: [2023-04-29 11:26:49,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,423] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +25: [2023-04-29 11:26:49,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +50: [2023-04-29 11:26:49,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +50: [2023-04-29 11:26:49,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +50: [2023-04-29 11:26:49,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +50: [2023-04-29 11:26:49,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +25: [2023-04-29 11:26:49,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +60: [2023-04-29 11:26:49,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +33: [2023-04-29 11:26:49,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +56: [2023-04-29 11:26:49,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +56: [2023-04-29 11:26:49,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +31: [2023-04-29 11:26:49,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +47: [2023-04-29 11:26:49,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +51: [2023-04-29 11:26:49,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 4: [2023-04-29 11:26:49,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 11:26:49,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 11:26:49,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 11:26:49,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 11:26:49,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +33: [2023-04-29 11:26:49,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +31: [2023-04-29 11:26:49,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +33: [2023-04-29 11:26:49,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +24: [2023-04-29 11:26:49,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +56: [2023-04-29 11:26:49,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +56: [2023-04-29 11:26:49,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. + 6: [2023-04-29 11:26:49,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 6: [2023-04-29 11:26:49,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 6: [2023-04-29 11:26:49,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 6: [2023-04-29 11:26:49,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +25: [2023-04-29 11:26:49,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +24: [2023-04-29 11:26:49,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +47: [2023-04-29 11:26:49,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +24: [2023-04-29 11:26:49,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +25: [2023-04-29 11:26:49,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +51: [2023-04-29 11:26:49,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 0: [2023-04-29 11:26:49,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +44: [2023-04-29 11:26:49,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +44: [2023-04-29 11:26:49,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +42: [2023-04-29 11:26:49,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +42: [2023-04-29 11:26:49,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 0: [2023-04-29 11:26:49,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +25: [2023-04-29 11:26:49,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +42: [2023-04-29 11:26:49,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +42: [2023-04-29 11:26:49,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +42: [2023-04-29 11:26:49,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +42: [2023-04-29 11:26:49,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +42: [2023-04-29 11:26:49,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +42: [2023-04-29 11:26:49,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +24: [2023-04-29 11:26:49,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +16: [2023-04-29 11:26:49,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 11:26:49,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +24: [2023-04-29 11:26:49,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +44: [2023-04-29 11:26:49,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +44: [2023-04-29 11:26:49,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +29: [2023-04-29 11:26:49,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +25: [2023-04-29 11:26:49,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +24: [2023-04-29 11:26:49,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +25: [2023-04-29 11:26:49,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +57: [2023-04-29 11:26:49,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 11:26:49,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +42: [2023-04-29 11:26:49,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +16: [2023-04-29 11:26:49,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +42: [2023-04-29 11:26:49,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +51: [2023-04-29 11:26:49,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +57: [2023-04-29 11:26:49,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +57: [2023-04-29 11:26:49,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 11:26:49,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +42: [2023-04-29 11:26:49,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +42: [2023-04-29 11:26:49,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +29: [2023-04-29 11:26:49,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +42: [2023-04-29 11:26:49,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +42: [2023-04-29 11:26:49,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +57: [2023-04-29 11:26:49,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +59: [2023-04-29 11:26:49,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +59: [2023-04-29 11:26:49,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +59: [2023-04-29 11:26:49,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +60: [2023-04-29 11:26:49,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +51: [2023-04-29 11:26:49,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +47: [2023-04-29 11:26:49,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +33: [2023-04-29 11:26:49,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +16: [2023-04-29 11:26:49,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +16: [2023-04-29 11:26:49,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +58: [2023-04-29 11:26:49,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +58: [2023-04-29 11:26:49,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +59: [2023-04-29 11:26:49,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +60: [2023-04-29 11:26:49,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +60: [2023-04-29 11:26:49,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 4: [2023-04-29 11:26:49,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +33: [2023-04-29 11:26:49,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 9: [2023-04-29 11:26:49,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 9: [2023-04-29 11:26:49,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 9: [2023-04-29 11:26:49,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 9: [2023-04-29 11:26:49,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +29: [2023-04-29 11:26:49,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +58: [2023-04-29 11:26:49,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +47: [2023-04-29 11:26:49,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 4: [2023-04-29 11:26:49,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +47: [2023-04-29 11:26:49,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 9: [2023-04-29 11:26:49,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +56: [2023-04-29 11:26:49,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +29: [2023-04-29 11:26:49,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +33: [2023-04-29 11:26:49,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +56: [2023-04-29 11:26:49,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 9: [2023-04-29 11:26:49,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +29: [2023-04-29 11:26:49,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 9: [2023-04-29 11:26:49,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +29: [2023-04-29 11:26:49,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... + 9: [2023-04-29 11:26:49,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +33: [2023-04-29 11:26:49,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +56: [2023-04-29 11:26:49,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +47: [2023-04-29 11:26:49,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +51: [2023-04-29 11:26:49,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +56: [2023-04-29 11:26:49,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +58: [2023-04-29 11:26:49,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +22: [2023-04-29 11:26:49,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +22: [2023-04-29 11:26:49,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +23: [2023-04-29 11:26:49,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +22: [2023-04-29 11:26:49,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +44: [2023-04-29 11:26:49,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +14: [2023-04-29 11:26:49,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +16: [2023-04-29 11:26:49,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +16: [2023-04-29 11:26:49,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +16: [2023-04-29 11:26:49,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +29: [2023-04-29 11:26:49,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +22: [2023-04-29 11:26:49,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +44: [2023-04-29 11:26:49,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +16: [2023-04-29 11:26:49,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +29: [2023-04-29 11:26:49,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +16: [2023-04-29 11:26:49,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 4: [2023-04-29 11:26:49,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +51: [2023-04-29 11:26:49,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +44: [2023-04-29 11:26:49,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +14: [2023-04-29 11:26:49,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +14: [2023-04-29 11:26:49,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 11:26:49,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +44: [2023-04-29 11:26:49,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 1: [2023-04-29 11:26:49,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +16: [2023-04-29 11:26:49,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +23: [2023-04-29 11:26:49,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +51: [2023-04-29 11:26:49,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +14: [2023-04-29 11:26:49,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 11:26:49,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 1: [2023-04-29 11:26:49,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +14: [2023-04-29 11:26:49,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +23: [2023-04-29 11:26:49,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +23: [2023-04-29 11:26:49,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +51: [2023-04-29 11:26:49,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 1: [2023-04-29 11:26:49,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 1: [2023-04-29 11:26:49,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +38: [2023-04-29 11:26:49,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +58: [2023-04-29 11:26:49,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +20: [2023-04-29 11:26:49,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +58: [2023-04-29 11:26:49,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +47: [2023-04-29 11:26:49,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +14: [2023-04-29 11:26:49,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 1: [2023-04-29 11:26:49,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +33: [2023-04-29 11:26:49,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +16: [2023-04-29 11:26:49,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +20: [2023-04-29 11:26:49,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +58: [2023-04-29 11:26:49,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +20: [2023-04-29 11:26:49,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +16: [2023-04-29 11:26:49,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 2: [2023-04-29 11:26:49,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 2: [2023-04-29 11:26:49,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +47: [2023-04-29 11:26:49,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +38: [2023-04-29 11:26:49,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +20: [2023-04-29 11:26:49,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +39: [2023-04-29 11:26:49,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 11:26:49,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 11:26:49,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 11:26:49,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +10: [2023-04-29 11:26:49,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +10: [2023-04-29 11:26:49,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +10: [2023-04-29 11:26:49,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +10: [2023-04-29 11:26:49,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +23: [2023-04-29 11:26:49,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +38: [2023-04-29 11:26:49,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +38: [2023-04-29 11:26:49,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +58: [2023-04-29 11:26:49,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +22: [2023-04-29 11:26:49,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +22: [2023-04-29 11:26:49,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +20: [2023-04-29 11:26:49,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 2: [2023-04-29 11:26:49,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +39: [2023-04-29 11:26:49,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +10: [2023-04-29 11:26:49,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +10: [2023-04-29 11:26:49,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +39: [2023-04-29 11:26:49,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +39: [2023-04-29 11:26:49,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +16: [2023-04-29 11:26:49,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +39: [2023-04-29 11:26:49,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +32: [2023-04-29 11:26:49,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +32: [2023-04-29 11:26:49,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +32: [2023-04-29 11:26:49,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +32: [2023-04-29 11:26:49,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +32: [2023-04-29 11:26:49,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +32: [2023-04-29 11:26:49,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +32: [2023-04-29 11:26:49,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +32: [2023-04-29 11:26:49,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +16: [2023-04-29 11:26:49,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +22: [2023-04-29 11:26:49,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +10: [2023-04-29 11:26:49,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +50: [2023-04-29 11:26:49,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +10: [2023-04-29 11:26:49,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +16: [2023-04-29 11:26:49,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +23: [2023-04-29 11:26:49,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +16: [2023-04-29 11:26:49,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +20: [2023-04-29 11:26:49,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... + 0: [2023-04-29 11:26:49,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +20: [2023-04-29 11:26:49,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +32: [2023-04-29 11:26:49,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +22: [2023-04-29 11:26:49,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +50: [2023-04-29 11:26:49,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +50: [2023-04-29 11:26:49,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +50: [2023-04-29 11:26:49,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 0: [2023-04-29 11:26:49,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 1: [2023-04-29 11:26:49,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +52: [2023-04-29 11:26:49,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +52: [2023-04-29 11:26:49,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +52: [2023-04-29 11:26:49,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. + 1: [2023-04-29 11:26:49,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +52: [2023-04-29 11:26:49,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +18: [2023-04-29 11:26:49,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +18: [2023-04-29 11:26:49,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +18: [2023-04-29 11:26:49,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +18: [2023-04-29 11:26:49,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +63: [2023-04-29 11:26:49,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +63: [2023-04-29 11:26:49,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 1: [2023-04-29 11:26:49,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +38: [2023-04-29 11:26:49,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +20: [2023-04-29 11:26:49,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +23: [2023-04-29 11:26:49,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +23: [2023-04-29 11:26:49,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 11:26:49,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +32: [2023-04-29 11:26:49,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... + 1: [2023-04-29 11:26:49,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +18: [2023-04-29 11:26:49,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +63: [2023-04-29 11:26:49,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +63: [2023-04-29 11:26:49,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 11:26:49,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +42: [2023-04-29 11:26:49,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 1: [2023-04-29 11:26:49,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +32: [2023-04-29 11:26:49,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +18: [2023-04-29 11:26:49,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +32: [2023-04-29 11:26:49,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +32: [2023-04-29 11:26:49,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +32: [2023-04-29 11:26:49,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +32: [2023-04-29 11:26:49,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +18: [2023-04-29 11:26:49,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +18: [2023-04-29 11:26:49,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +63: [2023-04-29 11:26:49,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +63: [2023-04-29 11:26:49,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +63: [2023-04-29 11:26:49,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +63: [2023-04-29 11:26:49,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +42: [2023-04-29 11:26:49,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +42: [2023-04-29 11:26:49,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. + 9: [2023-04-29 11:26:49,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +42: [2023-04-29 11:26:49,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +38: [2023-04-29 11:26:49,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 9: [2023-04-29 11:26:49,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 7: [2023-04-29 11:26:49,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 7: [2023-04-29 11:26:49,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 7: [2023-04-29 11:26:49,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 6: [2023-04-29 11:26:49,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 6: [2023-04-29 11:26:49,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +38: [2023-04-29 11:26:49,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +38: [2023-04-29 11:26:49,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 3: [2023-04-29 11:26:49,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 3: [2023-04-29 11:26:49,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 3: [2023-04-29 11:26:49,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 3: [2023-04-29 11:26:49,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 9: [2023-04-29 11:26:49,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 9: [2023-04-29 11:26:49,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +52: [2023-04-29 11:26:49,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +52: [2023-04-29 11:26:49,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +52: [2023-04-29 11:26:49,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +50: [2023-04-29 11:26:49,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 3: [2023-04-29 11:26:49,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +43: [2023-04-29 11:26:49,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +43: [2023-04-29 11:26:49,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +52: [2023-04-29 11:26:49,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +50: [2023-04-29 11:26:49,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 3: [2023-04-29 11:26:49,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +50: [2023-04-29 11:26:49,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 3: [2023-04-29 11:26:49,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +49: [2023-04-29 11:26:49,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +49: [2023-04-29 11:26:49,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +49: [2023-04-29 11:26:49,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +49: [2023-04-29 11:26:49,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 0: [2023-04-29 11:26:49,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +49: [2023-04-29 11:26:49,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +49: [2023-04-29 11:26:49,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +49: [2023-04-29 11:26:49,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +49: [2023-04-29 11:26:49,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 3: [2023-04-29 11:26:49,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +41: [2023-04-29 11:26:49,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +43: [2023-04-29 11:26:49,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +41: [2023-04-29 11:26:49,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +41: [2023-04-29 11:26:49,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +50: [2023-04-29 11:26:49,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +41: [2023-04-29 11:26:49,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +43: [2023-04-29 11:26:49,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +43: [2023-04-29 11:26:49,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +42: [2023-04-29 11:26:49,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +43: [2023-04-29 11:26:49,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 4: [2023-04-29 11:26:49,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 4: [2023-04-29 11:26:49,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 4: [2023-04-29 11:26:49,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 4: [2023-04-29 11:26:49,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +49: [2023-04-29 11:26:49,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +49: [2023-04-29 11:26:49,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +49: [2023-04-29 11:26:49,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +49: [2023-04-29 11:26:49,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +43: [2023-04-29 11:26:49,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +43: [2023-04-29 11:26:49,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +30: [2023-04-29 11:26:49,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +30: [2023-04-29 11:26:49,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +30: [2023-04-29 11:26:49,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +30: [2023-04-29 11:26:49,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +49: [2023-04-29 11:26:49,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +49: [2023-04-29 11:26:49,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +49: [2023-04-29 11:26:49,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +49: [2023-04-29 11:26:49,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +19: [2023-04-29 11:26:49,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +19: [2023-04-29 11:26:49,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +19: [2023-04-29 11:26:49,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +19: [2023-04-29 11:26:49,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +30: [2023-04-29 11:26:49,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +30: [2023-04-29 11:26:49,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +30: [2023-04-29 11:26:49,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 7: [2023-04-29 11:26:49,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +42: [2023-04-29 11:26:49,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 11:26:49,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 7: [2023-04-29 11:26:49,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +27: [2023-04-29 11:26:49,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +27: [2023-04-29 11:26:49,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +27: [2023-04-29 11:26:49,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +42: [2023-04-29 11:26:49,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +27: [2023-04-29 11:26:49,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 9: [2023-04-29 11:26:49,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 9: [2023-04-29 11:26:49,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +12: [2023-04-29 11:26:49,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +12: [2023-04-29 11:26:49,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +12: [2023-04-29 11:26:49,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +12: [2023-04-29 11:26:49,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +39: [2023-04-29 11:26:49,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 9: [2023-04-29 11:26:49,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 7: [2023-04-29 11:26:49,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 7: [2023-04-29 11:26:49,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +27: [2023-04-29 11:26:49,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +10: [2023-04-29 11:26:49,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +27: [2023-04-29 11:26:49,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +27: [2023-04-29 11:26:49,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +12: [2023-04-29 11:26:49,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +27: [2023-04-29 11:26:49,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +12: [2023-04-29 11:26:49,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +12: [2023-04-29 11:26:49,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +12: [2023-04-29 11:26:49,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +36: [2023-04-29 11:26:49,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 11:26:49,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 11:26:49,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 11:26:49,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 11:26:49,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 11:26:49,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 11:26:49,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 11:26:49,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +39: [2023-04-29 11:26:49,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 11:26:49,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 9: [2023-04-29 11:26:49,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +11: [2023-04-29 11:26:49,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +11: [2023-04-29 11:26:49,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +11: [2023-04-29 11:26:49,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +55: [2023-04-29 11:26:49,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +55: [2023-04-29 11:26:49,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +55: [2023-04-29 11:26:49,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +55: [2023-04-29 11:26:49,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +55: [2023-04-29 11:26:49,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +11: [2023-04-29 11:26:49,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +55: [2023-04-29 11:26:49,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +55: [2023-04-29 11:26:49,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +41: [2023-04-29 11:26:49,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +55: [2023-04-29 11:26:49,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +41: [2023-04-29 11:26:49,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +39: [2023-04-29 11:26:49,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +22: [2023-04-29 11:26:49,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +22: [2023-04-29 11:26:49,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 2: [2023-04-29 11:26:49,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +10: [2023-04-29 11:26:49,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +36: [2023-04-29 11:26:49,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +36: [2023-04-29 11:26:49,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +36: [2023-04-29 11:26:49,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +36: [2023-04-29 11:26:49,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +41: [2023-04-29 11:26:49,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +10: [2023-04-29 11:26:49,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 0: [2023-04-29 11:26:49,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 0: [2023-04-29 11:26:49,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +15: [2023-04-29 11:26:49,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +15: [2023-04-29 11:26:49,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +11: [2023-04-29 11:26:49,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +55: [2023-04-29 11:26:49,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +55: [2023-04-29 11:26:49,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +16: [2023-04-29 11:26:49,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +16: [2023-04-29 11:26:49,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +15: [2023-04-29 11:26:49,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +15: [2023-04-29 11:26:49,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +36: [2023-04-29 11:26:49,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +45: [2023-04-29 11:26:49,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +45: [2023-04-29 11:26:49,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 11:26:49,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +36: [2023-04-29 11:26:49,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +45: [2023-04-29 11:26:49,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +45: [2023-04-29 11:26:49,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +45: [2023-04-29 11:26:49,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +45: [2023-04-29 11:26:49,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +45: [2023-04-29 11:26:49,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +10: [2023-04-29 11:26:49,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +36: [2023-04-29 11:26:49,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +45: [2023-04-29 11:26:49,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +55: [2023-04-29 11:26:49,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +41: [2023-04-29 11:26:49,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +16: [2023-04-29 11:26:49,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +22: [2023-04-29 11:26:49,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +11: [2023-04-29 11:26:49,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +22: [2023-04-29 11:26:49,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... + 1: [2023-04-29 11:26:49,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 4: [2023-04-29 11:26:49,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +11: [2023-04-29 11:26:49,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +11: [2023-04-29 11:26:49,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +22: [2023-04-29 11:26:49,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 1: [2023-04-29 11:26:49,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +18: [2023-04-29 11:26:49,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +16: [2023-04-29 11:26:49,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +55: [2023-04-29 11:26:49,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +48: [2023-04-29 11:26:49,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +48: [2023-04-29 11:26:49,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +48: [2023-04-29 11:26:49,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +48: [2023-04-29 11:26:49,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +19: [2023-04-29 11:26:49,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +48: [2023-04-29 11:26:49,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +48: [2023-04-29 11:26:49,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +48: [2023-04-29 11:26:49,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +55: [2023-04-29 11:26:49,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +45: [2023-04-29 11:26:49,572] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +48: [2023-04-29 11:26:49,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +18: [2023-04-29 11:26:49,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 1: [2023-04-29 11:26:49,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +45: [2023-04-29 11:26:49,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +55: [2023-04-29 11:26:49,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +16: [2023-04-29 11:26:49,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +55: [2023-04-29 11:26:49,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +55: [2023-04-29 11:26:49,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +63: [2023-04-29 11:26:49,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +45: [2023-04-29 11:26:49,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +45: [2023-04-29 11:26:49,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +16: [2023-04-29 11:26:49,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +10: [2023-04-29 11:26:49,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +10: [2023-04-29 11:26:49,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +31: [2023-04-29 11:26:49,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +31: [2023-04-29 11:26:49,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +31: [2023-04-29 11:26:49,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 11:26:49,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +16: [2023-04-29 11:26:49,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +31: [2023-04-29 11:26:49,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 11:26:49,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +39: [2023-04-29 11:26:49,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +45: [2023-04-29 11:26:49,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +45: [2023-04-29 11:26:49,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +63: [2023-04-29 11:26:49,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +19: [2023-04-29 11:26:49,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +18: [2023-04-29 11:26:49,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +18: [2023-04-29 11:26:49,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +22: [2023-04-29 11:26:49,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +19: [2023-04-29 11:26:49,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +45: [2023-04-29 11:26:49,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... + 1: [2023-04-29 11:26:49,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +19: [2023-04-29 11:26:49,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +48: [2023-04-29 11:26:49,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +45: [2023-04-29 11:26:49,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 11:26:49,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +22: [2023-04-29 11:26:49,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +48: [2023-04-29 11:26:49,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +16: [2023-04-29 11:26:49,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +48: [2023-04-29 11:26:49,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +48: [2023-04-29 11:26:49,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +48: [2023-04-29 11:26:49,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +48: [2023-04-29 11:26:49,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +48: [2023-04-29 11:26:49,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +31: [2023-04-29 11:26:49,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +31: [2023-04-29 11:26:49,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +31: [2023-04-29 11:26:49,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +48: [2023-04-29 11:26:49,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +31: [2023-04-29 11:26:49,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +32: [2023-04-29 11:26:49,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +32: [2023-04-29 11:26:49,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +32: [2023-04-29 11:26:49,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +32: [2023-04-29 11:26:49,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +56: [2023-04-29 11:26:49,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +56: [2023-04-29 11:26:49,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +56: [2023-04-29 11:26:49,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 1: [2023-04-29 11:26:49,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +56: [2023-04-29 11:26:49,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +56: [2023-04-29 11:26:49,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +56: [2023-04-29 11:26:49,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +56: [2023-04-29 11:26:49,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +56: [2023-04-29 11:26:49,585] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +22: [2023-04-29 11:26:49,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +35: [2023-04-29 11:26:49,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +35: [2023-04-29 11:26:49,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +35: [2023-04-29 11:26:49,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +35: [2023-04-29 11:26:49,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 11:26:49,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +35: [2023-04-29 11:26:49,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +35: [2023-04-29 11:26:49,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +35: [2023-04-29 11:26:49,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +63: [2023-04-29 11:26:49,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +35: [2023-04-29 11:26:49,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +30: [2023-04-29 11:26:49,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +56: [2023-04-29 11:26:49,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +10: [2023-04-29 11:26:49,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +56: [2023-04-29 11:26:49,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +56: [2023-04-29 11:26:49,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +39: [2023-04-29 11:26:49,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +56: [2023-04-29 11:26:49,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +39: [2023-04-29 11:26:49,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +39: [2023-04-29 11:26:49,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +56: [2023-04-29 11:26:49,591] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +43: [2023-04-29 11:26:49,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +25: [2023-04-29 11:26:49,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +25: [2023-04-29 11:26:49,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 2: [2023-04-29 11:26:49,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +56: [2023-04-29 11:26:49,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +15: [2023-04-29 11:26:49,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +56: [2023-04-29 11:26:49,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... + 3: [2023-04-29 11:26:49,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 11:26:49,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +18: [2023-04-29 11:26:49,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +25: [2023-04-29 11:26:49,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +35: [2023-04-29 11:26:49,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +35: [2023-04-29 11:26:49,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +25: [2023-04-29 11:26:49,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +56: [2023-04-29 11:26:49,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +35: [2023-04-29 11:26:49,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +35: [2023-04-29 11:26:49,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +28: [2023-04-29 11:26:49,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +25: [2023-04-29 11:26:49,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +28: [2023-04-29 11:26:49,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +28: [2023-04-29 11:26:49,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +35: [2023-04-29 11:26:49,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +28: [2023-04-29 11:26:49,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +35: [2023-04-29 11:26:49,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +25: [2023-04-29 11:26:49,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +35: [2023-04-29 11:26:49,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt... +35: [2023-04-29 11:26:49,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt... +49: [2023-04-29 11:26:49,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 3: [2023-04-29 11:26:49,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +25: [2023-04-29 11:26:49,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +63: [2023-04-29 11:26:49,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +15: [2023-04-29 11:26:49,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +15: [2023-04-29 11:26:49,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +21: [2023-04-29 11:26:49,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +21: [2023-04-29 11:26:49,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +21: [2023-04-29 11:26:49,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +18: [2023-04-29 11:26:49,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +21: [2023-04-29 11:26:49,601] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +25: [2023-04-29 11:26:49,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +43: [2023-04-29 11:26:49,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +28: [2023-04-29 11:26:49,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +28: [2023-04-29 11:26:49,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +63: [2023-04-29 11:26:49,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +15: [2023-04-29 11:26:49,603] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 3: [2023-04-29 11:26:49,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 3: [2023-04-29 11:26:49,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +43: [2023-04-29 11:26:49,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +28: [2023-04-29 11:26:49,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 3: [2023-04-29 11:26:49,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 3: [2023-04-29 11:26:49,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +10: [2023-04-29 11:26:49,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 3: [2023-04-29 11:26:49,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +10: [2023-04-29 11:26:49,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 3: [2023-04-29 11:26:49,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +28: [2023-04-29 11:26:49,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +43: [2023-04-29 11:26:49,605] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +63: [2023-04-29 11:26:49,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +63: [2023-04-29 11:26:49,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +27: [2023-04-29 11:26:49,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +19: [2023-04-29 11:26:49,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +19: [2023-04-29 11:26:49,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +47: [2023-04-29 11:26:49,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +47: [2023-04-29 11:26:49,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +19: [2023-04-29 11:26:49,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +19: [2023-04-29 11:26:49,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +10: [2023-04-29 11:26:49,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +18: [2023-04-29 11:26:49,611] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +47: [2023-04-29 11:26:49,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +47: [2023-04-29 11:26:49,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +18: [2023-04-29 11:26:49,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 7: [2023-04-29 11:26:49,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +18: [2023-04-29 11:26:49,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +12: [2023-04-29 11:26:49,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +18: [2023-04-29 11:26:49,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +18: [2023-04-29 11:26:49,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +18: [2023-04-29 11:26:49,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +30: [2023-04-29 11:26:49,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +63: [2023-04-29 11:26:49,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +19: [2023-04-29 11:26:49,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +19: [2023-04-29 11:26:49,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +49: [2023-04-29 11:26:49,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +49: [2023-04-29 11:26:49,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +10: [2023-04-29 11:26:49,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +10: [2023-04-29 11:26:49,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +20: [2023-04-29 11:26:49,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +20: [2023-04-29 11:26:49,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +20: [2023-04-29 11:26:49,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +20: [2023-04-29 11:26:49,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 11:26:49,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +19: [2023-04-29 11:26:49,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +21: [2023-04-29 11:26:49,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +21: [2023-04-29 11:26:49,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +19: [2023-04-29 11:26:49,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +21: [2023-04-29 11:26:49,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +21: [2023-04-29 11:26:49,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +43: [2023-04-29 11:26:49,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +49: [2023-04-29 11:26:49,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +63: [2023-04-29 11:26:49,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. + 7: [2023-04-29 11:26:49,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +32: [2023-04-29 11:26:49,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +30: [2023-04-29 11:26:49,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +30: [2023-04-29 11:26:49,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +30: [2023-04-29 11:26:49,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 2: [2023-04-29 11:26:49,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 2: [2023-04-29 11:26:49,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 2: [2023-04-29 11:26:49,619] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. + 2: [2023-04-29 11:26:49,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +63: [2023-04-29 11:26:49,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +63: [2023-04-29 11:26:49,620] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +20: [2023-04-29 11:26:49,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +20: [2023-04-29 11:26:49,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +32: [2023-04-29 11:26:49,621] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +12: [2023-04-29 11:26:49,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +12: [2023-04-29 11:26:49,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +32: [2023-04-29 11:26:49,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +21: [2023-04-29 11:26:49,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +32: [2023-04-29 11:26:49,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 7: [2023-04-29 11:26:49,622] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +21: [2023-04-29 11:26:49,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +20: [2023-04-29 11:26:49,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +21: [2023-04-29 11:26:49,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +20: [2023-04-29 11:26:49,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +21: [2023-04-29 11:26:49,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +49: [2023-04-29 11:26:49,624] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 11:26:49,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 3: [2023-04-29 11:26:49,625] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 3: [2023-04-29 11:26:49,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +27: [2023-04-29 11:26:49,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +27: [2023-04-29 11:26:49,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +27: [2023-04-29 11:26:49,626] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +11: [2023-04-29 11:26:49,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +22: [2023-04-29 11:26:49,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +22: [2023-04-29 11:26:49,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +22: [2023-04-29 11:26:49,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +55: [2023-04-29 11:26:49,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +22: [2023-04-29 11:26:49,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +59: [2023-04-29 11:26:49,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +59: [2023-04-29 11:26:49,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +12: [2023-04-29 11:26:49,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +55: [2023-04-29 11:26:49,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +59: [2023-04-29 11:26:49,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +19: [2023-04-29 11:26:49,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 3: [2023-04-29 11:26:49,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +59: [2023-04-29 11:26:49,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +59: [2023-04-29 11:26:49,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +59: [2023-04-29 11:26:49,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +21: [2023-04-29 11:26:49,632] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +59: [2023-04-29 11:26:49,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +59: [2023-04-29 11:26:49,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +46: [2023-04-29 11:26:49,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +46: [2023-04-29 11:26:49,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +55: [2023-04-29 11:26:49,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +55: [2023-04-29 11:26:49,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +46: [2023-04-29 11:26:49,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +46: [2023-04-29 11:26:49,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +46: [2023-04-29 11:26:49,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +46: [2023-04-29 11:26:49,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +46: [2023-04-29 11:26:49,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +45: [2023-04-29 11:26:49,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +46: [2023-04-29 11:26:49,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... + 4: [2023-04-29 11:26:49,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +19: [2023-04-29 11:26:49,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +22: [2023-04-29 11:26:49,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +43: [2023-04-29 11:26:49,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +43: [2023-04-29 11:26:49,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +43: [2023-04-29 11:26:49,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +47: [2023-04-29 11:26:49,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +47: [2023-04-29 11:26:49,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 3: [2023-04-29 11:26:49,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +21: [2023-04-29 11:26:49,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +63: [2023-04-29 11:26:49,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +63: [2023-04-29 11:26:49,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +19: [2023-04-29 11:26:49,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +21: [2023-04-29 11:26:49,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +22: [2023-04-29 11:26:49,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +36: [2023-04-29 11:26:49,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 11:26:49,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +36: [2023-04-29 11:26:49,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +22: [2023-04-29 11:26:49,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +21: [2023-04-29 11:26:49,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +59: [2023-04-29 11:26:49,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +59: [2023-04-29 11:26:49,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +27: [2023-04-29 11:26:49,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +47: [2023-04-29 11:26:49,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +59: [2023-04-29 11:26:49,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... + 3: [2023-04-29 11:26:49,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +19: [2023-04-29 11:26:49,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +59: [2023-04-29 11:26:49,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +46: [2023-04-29 11:26:49,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +46: [2023-04-29 11:26:49,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +46: [2023-04-29 11:26:49,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +46: [2023-04-29 11:26:49,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +59: [2023-04-29 11:26:49,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +22: [2023-04-29 11:26:49,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 3: [2023-04-29 11:26:49,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +46: [2023-04-29 11:26:49,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +12: [2023-04-29 11:26:49,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +46: [2023-04-29 11:26:49,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +47: [2023-04-29 11:26:49,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +30: [2023-04-29 11:26:49,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +46: [2023-04-29 11:26:49,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +46: [2023-04-29 11:26:49,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 3: [2023-04-29 11:26:49,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +59: [2023-04-29 11:26:49,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +18: [2023-04-29 11:26:49,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +45: [2023-04-29 11:26:49,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +59: [2023-04-29 11:26:49,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +59: [2023-04-29 11:26:49,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +11: [2023-04-29 11:26:49,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +11: [2023-04-29 11:26:49,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +11: [2023-04-29 11:26:49,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +48: [2023-04-29 11:26:49,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 3: [2023-04-29 11:26:49,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +63: [2023-04-29 11:26:49,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +45: [2023-04-29 11:26:49,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +17: [2023-04-29 11:26:49,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +17: [2023-04-29 11:26:49,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +18: [2023-04-29 11:26:49,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +18: [2023-04-29 11:26:49,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +63: [2023-04-29 11:26:49,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +30: [2023-04-29 11:26:49,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +45: [2023-04-29 11:26:49,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +48: [2023-04-29 11:26:49,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +48: [2023-04-29 11:26:49,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +49: [2023-04-29 11:26:49,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +12: [2023-04-29 11:26:49,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +30: [2023-04-29 11:26:49,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +30: [2023-04-29 11:26:49,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +62: [2023-04-29 11:26:49,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +62: [2023-04-29 11:26:49,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +49: [2023-04-29 11:26:49,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +49: [2023-04-29 11:26:49,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +11: [2023-04-29 11:26:49,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +36: [2023-04-29 11:26:49,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +31: [2023-04-29 11:26:49,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +31: [2023-04-29 11:26:49,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +31: [2023-04-29 11:26:49,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +48: [2023-04-29 11:26:49,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +56: [2023-04-29 11:26:49,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +12: [2023-04-29 11:26:49,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,650] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +17: [2023-04-29 11:26:49,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +51: [2023-04-29 11:26:49,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +51: [2023-04-29 11:26:49,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +17: [2023-04-29 11:26:49,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +51: [2023-04-29 11:26:49,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +25: [2023-04-29 11:26:49,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +51: [2023-04-29 11:26:49,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. + 4: [2023-04-29 11:26:49,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +31: [2023-04-29 11:26:49,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +57: [2023-04-29 11:26:49,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +57: [2023-04-29 11:26:49,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +62: [2023-04-29 11:26:49,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +57: [2023-04-29 11:26:49,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +57: [2023-04-29 11:26:49,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 4: [2023-04-29 11:26:49,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +62: [2023-04-29 11:26:49,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +57: [2023-04-29 11:26:49,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +57: [2023-04-29 11:26:49,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +57: [2023-04-29 11:26:49,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +55: [2023-04-29 11:26:49,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +57: [2023-04-29 11:26:49,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 4: [2023-04-29 11:26:49,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +18: [2023-04-29 11:26:49,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +27: [2023-04-29 11:26:49,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +34: [2023-04-29 11:26:49,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +34: [2023-04-29 11:26:49,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +34: [2023-04-29 11:26:49,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +34: [2023-04-29 11:26:49,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +34: [2023-04-29 11:26:49,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +34: [2023-04-29 11:26:49,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +34: [2023-04-29 11:26:49,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +34: [2023-04-29 11:26:49,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 2: [2023-04-29 11:26:49,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +19: [2023-04-29 11:26:49,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +19: [2023-04-29 11:26:49,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +56: [2023-04-29 11:26:49,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +29: [2023-04-29 11:26:49,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +29: [2023-04-29 11:26:49,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +29: [2023-04-29 11:26:49,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +55: [2023-04-29 11:26:49,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +15: [2023-04-29 11:26:49,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +57: [2023-04-29 11:26:49,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +57: [2023-04-29 11:26:49,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +57: [2023-04-29 11:26:49,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +57: [2023-04-29 11:26:49,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +57: [2023-04-29 11:26:49,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +27: [2023-04-29 11:26:49,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +12: [2023-04-29 11:26:49,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +29: [2023-04-29 11:26:49,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +57: [2023-04-29 11:26:49,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +27: [2023-04-29 11:26:49,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +53: [2023-04-29 11:26:49,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +53: [2023-04-29 11:26:49,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +45: [2023-04-29 11:26:49,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +43: [2023-04-29 11:26:49,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +43: [2023-04-29 11:26:49,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +43: [2023-04-29 11:26:49,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +43: [2023-04-29 11:26:49,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +57: [2023-04-29 11:26:49,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +57: [2023-04-29 11:26:49,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +28: [2023-04-29 11:26:49,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 11:26:49,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +25: [2023-04-29 11:26:49,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +50: [2023-04-29 11:26:49,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +50: [2023-04-29 11:26:49,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +50: [2023-04-29 11:26:49,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +50: [2023-04-29 11:26:49,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +54: [2023-04-29 11:26:49,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +54: [2023-04-29 11:26:49,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +53: [2023-04-29 11:26:49,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +53: [2023-04-29 11:26:49,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +53: [2023-04-29 11:26:49,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +53: [2023-04-29 11:26:49,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +53: [2023-04-29 11:26:49,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +34: [2023-04-29 11:26:49,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +29: [2023-04-29 11:26:49,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +56: [2023-04-29 11:26:49,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +53: [2023-04-29 11:26:49,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +42: [2023-04-29 11:26:49,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +42: [2023-04-29 11:26:49,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +34: [2023-04-29 11:26:49,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +34: [2023-04-29 11:26:49,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +29: [2023-04-29 11:26:49,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +19: [2023-04-29 11:26:49,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +56: [2023-04-29 11:26:49,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +29: [2023-04-29 11:26:49,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +29: [2023-04-29 11:26:49,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +19: [2023-04-29 11:26:49,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +17: [2023-04-29 11:26:49,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +35: [2023-04-29 11:26:49,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +15: [2023-04-29 11:26:49,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +28: [2023-04-29 11:26:49,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +42: [2023-04-29 11:26:49,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +25: [2023-04-29 11:26:49,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +42: [2023-04-29 11:26:49,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +34: [2023-04-29 11:26:49,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +26: [2023-04-29 11:26:49,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +26: [2023-04-29 11:26:49,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +54: [2023-04-29 11:26:49,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +54: [2023-04-29 11:26:49,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +34: [2023-04-29 11:26:49,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +55: [2023-04-29 11:26:49,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 11:26:49,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +55: [2023-04-29 11:26:49,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +17: [2023-04-29 11:26:49,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +13: [2023-04-29 11:26:49,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +17: [2023-04-29 11:26:49,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +13: [2023-04-29 11:26:49,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +13: [2023-04-29 11:26:49,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 11:26:49,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +13: [2023-04-29 11:26:49,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +36: [2023-04-29 11:26:49,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 11:26:49,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +53: [2023-04-29 11:26:49,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +53: [2023-04-29 11:26:49,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +53: [2023-04-29 11:26:49,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +53: [2023-04-29 11:26:49,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +53: [2023-04-29 11:26:49,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +15: [2023-04-29 11:26:49,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +15: [2023-04-29 11:26:49,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +34: [2023-04-29 11:26:49,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +34: [2023-04-29 11:26:49,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +53: [2023-04-29 11:26:49,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +17: [2023-04-29 11:26:49,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +53: [2023-04-29 11:26:49,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +34: [2023-04-29 11:26:49,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +45: [2023-04-29 11:26:49,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +53: [2023-04-29 11:26:49,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +10: [2023-04-29 11:26:49,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +15: [2023-04-29 11:26:49,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +15: [2023-04-29 11:26:49,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +28: [2023-04-29 11:26:49,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +28: [2023-04-29 11:26:49,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +15: [2023-04-29 11:26:49,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +35: [2023-04-29 11:26:49,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +17: [2023-04-29 11:26:49,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +24: [2023-04-29 11:26:49,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +24: [2023-04-29 11:26:49,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +24: [2023-04-29 11:26:49,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +24: [2023-04-29 11:26:49,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +26: [2023-04-29 11:26:49,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +26: [2023-04-29 11:26:49,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_16-model_01-model_states.pt. +35: [2023-04-29 11:26:49,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +35: [2023-04-29 11:26:49,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_00-model_states.pt. +17: [2023-04-29 11:26:49,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +17: [2023-04-29 11:26:49,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +13: [2023-04-29 11:26:49,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 11:26:49,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 11:26:49,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 11:26:49,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +15: [2023-04-29 11:26:49,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +17: [2023-04-29 11:26:49,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +17: [2023-04-29 11:26:49,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +48: [2023-04-29 11:26:49,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +44: [2023-04-29 11:26:49,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +44: [2023-04-29 11:26:49,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +15: [2023-04-29 11:26:49,674] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +44: [2023-04-29 11:26:49,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +44: [2023-04-29 11:26:49,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +56: [2023-04-29 11:26:49,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +44: [2023-04-29 11:26:49,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +44: [2023-04-29 11:26:49,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +44: [2023-04-29 11:26:49,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +11: [2023-04-29 11:26:49,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 11:26:49,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +31: [2023-04-29 11:26:49,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +44: [2023-04-29 11:26:49,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +25: [2023-04-29 11:26:49,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +24: [2023-04-29 11:26:49,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +17: [2023-04-29 11:26:49,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +10: [2023-04-29 11:26:49,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +24: [2023-04-29 11:26:49,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +17: [2023-04-29 11:26:49,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +15: [2023-04-29 11:26:49,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +48: [2023-04-29 11:26:49,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +15: [2023-04-29 11:26:49,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +24: [2023-04-29 11:26:49,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +45: [2023-04-29 11:26:49,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +17: [2023-04-29 11:26:49,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +15: [2023-04-29 11:26:49,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +19: [2023-04-29 11:26:49,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +62: [2023-04-29 11:26:49,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +15: [2023-04-29 11:26:49,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +24: [2023-04-29 11:26:49,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +48: [2023-04-29 11:26:49,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +11: [2023-04-29 11:26:49,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +51: [2023-04-29 11:26:49,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +45: [2023-04-29 11:26:49,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +31: [2023-04-29 11:26:49,679] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +31: [2023-04-29 11:26:49,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +25: [2023-04-29 11:26:49,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +44: [2023-04-29 11:26:49,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +51: [2023-04-29 11:26:49,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +51: [2023-04-29 11:26:49,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 11:26:49,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +44: [2023-04-29 11:26:49,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +44: [2023-04-29 11:26:49,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +44: [2023-04-29 11:26:49,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +51: [2023-04-29 11:26:49,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +19: [2023-04-29 11:26:49,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +19: [2023-04-29 11:26:49,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +48: [2023-04-29 11:26:49,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +31: [2023-04-29 11:26:49,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +62: [2023-04-29 11:26:49,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 11:26:49,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +44: [2023-04-29 11:26:49,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +44: [2023-04-29 11:26:49,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +44: [2023-04-29 11:26:49,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +44: [2023-04-29 11:26:49,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +15: [2023-04-29 11:26:49,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +37: [2023-04-29 11:26:49,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +37: [2023-04-29 11:26:49,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +37: [2023-04-29 11:26:49,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +20: [2023-04-29 11:26:49,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +37: [2023-04-29 11:26:49,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 8: [2023-04-29 11:26:49,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 8: [2023-04-29 11:26:49,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 8: [2023-04-29 11:26:49,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +37: [2023-04-29 11:26:49,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +37: [2023-04-29 11:26:49,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +37: [2023-04-29 11:26:49,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 8: [2023-04-29 11:26:49,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +37: [2023-04-29 11:26:49,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +28: [2023-04-29 11:26:49,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +15: [2023-04-29 11:26:49,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +43: [2023-04-29 11:26:49,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +43: [2023-04-29 11:26:49,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +43: [2023-04-29 11:26:49,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +25: [2023-04-29 11:26:49,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +43: [2023-04-29 11:26:49,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +10: [2023-04-29 11:26:49,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 11:26:49,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 11:26:49,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +20: [2023-04-29 11:26:49,689] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +56: [2023-04-29 11:26:49,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +56: [2023-04-29 11:26:49,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +50: [2023-04-29 11:26:49,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +21: [2023-04-29 11:26:49,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +21: [2023-04-29 11:26:49,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +54: [2023-04-29 11:26:49,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +54: [2023-04-29 11:26:49,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +56: [2023-04-29 11:26:49,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +37: [2023-04-29 11:26:49,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +28: [2023-04-29 11:26:49,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +54: [2023-04-29 11:26:49,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +25: [2023-04-29 11:26:49,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +37: [2023-04-29 11:26:49,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +20: [2023-04-29 11:26:49,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +37: [2023-04-29 11:26:49,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... + 8: [2023-04-29 11:26:49,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +15: [2023-04-29 11:26:49,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 8: [2023-04-29 11:26:49,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +22: [2023-04-29 11:26:49,693] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +54: [2023-04-29 11:26:49,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +50: [2023-04-29 11:26:49,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 11:26:49,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +50: [2023-04-29 11:26:49,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +50: [2023-04-29 11:26:49,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +21: [2023-04-29 11:26:49,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +21: [2023-04-29 11:26:49,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +21: [2023-04-29 11:26:49,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +42: [2023-04-29 11:26:49,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 11:26:49,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +21: [2023-04-29 11:26:49,695] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +35: [2023-04-29 11:26:49,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 11:26:49,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +26: [2023-04-29 11:26:49,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +26: [2023-04-29 11:26:49,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +10: [2023-04-29 11:26:49,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +37: [2023-04-29 11:26:49,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... + 7: [2023-04-29 11:26:49,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +19: [2023-04-29 11:26:49,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +10: [2023-04-29 11:26:49,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +37: [2023-04-29 11:26:49,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +26: [2023-04-29 11:26:49,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +37: [2023-04-29 11:26:49,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +37: [2023-04-29 11:26:49,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +10: [2023-04-29 11:26:49,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +37: [2023-04-29 11:26:49,698] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +40: [2023-04-29 11:26:49,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +40: [2023-04-29 11:26:49,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +40: [2023-04-29 11:26:49,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +40: [2023-04-29 11:26:49,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +40: [2023-04-29 11:26:49,699] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +40: [2023-04-29 11:26:49,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +40: [2023-04-29 11:26:49,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +20: [2023-04-29 11:26:49,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +40: [2023-04-29 11:26:49,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 3: [2023-04-29 11:26:49,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +25: [2023-04-29 11:26:49,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 7: [2023-04-29 11:26:49,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +46: [2023-04-29 11:26:49,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +19: [2023-04-29 11:26:49,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +28: [2023-04-29 11:26:49,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +28: [2023-04-29 11:26:49,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +63: [2023-04-29 11:26:49,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 3: [2023-04-29 11:26:49,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +40: [2023-04-29 11:26:49,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +40: [2023-04-29 11:26:49,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +35: [2023-04-29 11:26:49,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +35: [2023-04-29 11:26:49,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +59: [2023-04-29 11:26:49,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +63: [2023-04-29 11:26:49,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +63: [2023-04-29 11:26:49,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +40: [2023-04-29 11:26:49,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +40: [2023-04-29 11:26:49,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +19: [2023-04-29 11:26:49,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +35: [2023-04-29 11:26:49,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +22: [2023-04-29 11:26:49,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +22: [2023-04-29 11:26:49,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +40: [2023-04-29 11:26:49,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... + 3: [2023-04-29 11:26:49,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +46: [2023-04-29 11:26:49,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +40: [2023-04-29 11:26:49,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +22: [2023-04-29 11:26:49,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +18: [2023-04-29 11:26:49,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +26: [2023-04-29 11:26:49,708] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt... +40: [2023-04-29 11:26:49,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 3: [2023-04-29 11:26:49,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +40: [2023-04-29 11:26:49,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +63: [2023-04-29 11:26:49,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +21: [2023-04-29 11:26:49,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 11:26:49,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 11:26:49,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +46: [2023-04-29 11:26:49,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +20: [2023-04-29 11:26:49,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +18: [2023-04-29 11:26:49,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +52: [2023-04-29 11:26:49,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +52: [2023-04-29 11:26:49,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 6: [2023-04-29 11:26:49,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 6: [2023-04-29 11:26:49,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +19: [2023-04-29 11:26:49,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 6: [2023-04-29 11:26:49,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 3: [2023-04-29 11:26:49,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +63: [2023-04-29 11:26:49,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +63: [2023-04-29 11:26:49,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +52: [2023-04-29 11:26:49,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +52: [2023-04-29 11:26:49,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +52: [2023-04-29 11:26:49,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +52: [2023-04-29 11:26:49,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +52: [2023-04-29 11:26:49,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +20: [2023-04-29 11:26:49,714] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +52: [2023-04-29 11:26:49,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +46: [2023-04-29 11:26:49,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +18: [2023-04-29 11:26:49,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 11:26:49,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +18: [2023-04-29 11:26:49,716] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +63: [2023-04-29 11:26:49,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +18: [2023-04-29 11:26:49,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +57: [2023-04-29 11:26:49,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +23: [2023-04-29 11:26:49,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +23: [2023-04-29 11:26:49,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +23: [2023-04-29 11:26:49,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 2: [2023-04-29 11:26:49,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +21: [2023-04-29 11:26:49,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +23: [2023-04-29 11:26:49,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +29: [2023-04-29 11:26:49,718] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +21: [2023-04-29 11:26:49,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +52: [2023-04-29 11:26:49,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +52: [2023-04-29 11:26:49,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +52: [2023-04-29 11:26:49,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +52: [2023-04-29 11:26:49,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +21: [2023-04-29 11:26:49,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +59: [2023-04-29 11:26:49,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 3: [2023-04-29 11:26:49,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +59: [2023-04-29 11:26:49,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +52: [2023-04-29 11:26:49,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +22: [2023-04-29 11:26:49,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +52: [2023-04-29 11:26:49,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 3: [2023-04-29 11:26:49,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +52: [2023-04-29 11:26:49,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +20: [2023-04-29 11:26:49,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +12: [2023-04-29 11:26:49,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +12: [2023-04-29 11:26:49,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +18: [2023-04-29 11:26:49,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +61: [2023-04-29 11:26:49,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +61: [2023-04-29 11:26:49,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +52: [2023-04-29 11:26:49,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +59: [2023-04-29 11:26:49,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +61: [2023-04-29 11:26:49,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +61: [2023-04-29 11:26:49,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +61: [2023-04-29 11:26:49,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +61: [2023-04-29 11:26:49,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +61: [2023-04-29 11:26:49,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +61: [2023-04-29 11:26:49,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +29: [2023-04-29 11:26:49,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +21: [2023-04-29 11:26:49,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +33: [2023-04-29 11:26:49,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +33: [2023-04-29 11:26:49,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +63: [2023-04-29 11:26:49,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +12: [2023-04-29 11:26:49,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +12: [2023-04-29 11:26:49,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +34: [2023-04-29 11:26:49,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +18: [2023-04-29 11:26:49,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 2: [2023-04-29 11:26:49,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +57: [2023-04-29 11:26:49,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +21: [2023-04-29 11:26:49,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +21: [2023-04-29 11:26:49,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +33: [2023-04-29 11:26:49,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +14: [2023-04-29 11:26:49,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +14: [2023-04-29 11:26:49,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +19: [2023-04-29 11:26:49,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +46: [2023-04-29 11:26:49,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +33: [2023-04-29 11:26:49,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +34: [2023-04-29 11:26:49,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +57: [2023-04-29 11:26:49,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 2: [2023-04-29 11:26:49,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 3: [2023-04-29 11:26:49,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +61: [2023-04-29 11:26:49,728] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +61: [2023-04-29 11:26:49,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +20: [2023-04-29 11:26:49,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +61: [2023-04-29 11:26:49,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +14: [2023-04-29 11:26:49,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +61: [2023-04-29 11:26:49,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +44: [2023-04-29 11:26:49,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +14: [2023-04-29 11:26:49,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +61: [2023-04-29 11:26:49,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +61: [2023-04-29 11:26:49,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +18: [2023-04-29 11:26:49,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +61: [2023-04-29 11:26:49,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +41: [2023-04-29 11:26:49,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +41: [2023-04-29 11:26:49,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +61: [2023-04-29 11:26:49,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +53: [2023-04-29 11:26:49,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +53: [2023-04-29 11:26:49,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +14: [2023-04-29 11:26:49,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +46: [2023-04-29 11:26:49,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +41: [2023-04-29 11:26:49,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +41: [2023-04-29 11:26:49,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +41: [2023-04-29 11:26:49,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +41: [2023-04-29 11:26:49,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +41: [2023-04-29 11:26:49,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +41: [2023-04-29 11:26:49,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +57: [2023-04-29 11:26:49,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +59: [2023-04-29 11:26:49,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +14: [2023-04-29 11:26:49,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +14: [2023-04-29 11:26:49,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 2: [2023-04-29 11:26:49,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +13: [2023-04-29 11:26:49,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +41: [2023-04-29 11:26:49,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +17: [2023-04-29 11:26:49,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +53: [2023-04-29 11:26:49,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +53: [2023-04-29 11:26:49,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +41: [2023-04-29 11:26:49,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +14: [2023-04-29 11:26:49,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +29: [2023-04-29 11:26:49,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +29: [2023-04-29 11:26:49,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +41: [2023-04-29 11:26:49,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +41: [2023-04-29 11:26:49,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +41: [2023-04-29 11:26:49,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +15: [2023-04-29 11:26:49,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +15: [2023-04-29 11:26:49,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +17: [2023-04-29 11:26:49,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +46: [2023-04-29 11:26:49,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +17: [2023-04-29 11:26:49,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +41: [2023-04-29 11:26:49,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +41: [2023-04-29 11:26:49,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 6: [2023-04-29 11:26:49,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 6: [2023-04-29 11:26:49,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +41: [2023-04-29 11:26:49,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... + 6: [2023-04-29 11:26:49,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +13: [2023-04-29 11:26:49,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +13: [2023-04-29 11:26:49,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +13: [2023-04-29 11:26:49,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 5: [2023-04-29 11:26:49,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 5: [2023-04-29 11:26:49,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +46: [2023-04-29 11:26:49,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +24: [2023-04-29 11:26:49,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +24: [2023-04-29 11:26:49,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +22: [2023-04-29 11:26:49,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +22: [2023-04-29 11:26:49,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 8: [2023-04-29 11:26:49,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 8: [2023-04-29 11:26:49,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 8: [2023-04-29 11:26:49,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 5: [2023-04-29 11:26:49,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +17: [2023-04-29 11:26:49,745] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 5: [2023-04-29 11:26:49,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +23: [2023-04-29 11:26:49,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +17: [2023-04-29 11:26:49,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +57: [2023-04-29 11:26:49,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +44: [2023-04-29 11:26:49,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +23: [2023-04-29 11:26:49,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +23: [2023-04-29 11:26:49,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +23: [2023-04-29 11:26:49,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +12: [2023-04-29 11:26:49,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +26: [2023-04-29 11:26:49,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +26: [2023-04-29 11:26:49,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +24: [2023-04-29 11:26:49,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +24: [2023-04-29 11:26:49,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +44: [2023-04-29 11:26:49,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +34: [2023-04-29 11:26:49,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +34: [2023-04-29 11:26:49,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +29: [2023-04-29 11:26:49,749] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +16: [2023-04-29 11:26:49,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +16: [2023-04-29 11:26:49,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +16: [2023-04-29 11:26:49,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 5: [2023-04-29 11:26:49,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +16: [2023-04-29 11:26:49,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +15: [2023-04-29 11:26:49,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +44: [2023-04-29 11:26:49,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +22: [2023-04-29 11:26:49,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +17: [2023-04-29 11:26:49,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +26: [2023-04-29 11:26:49,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +17: [2023-04-29 11:26:49,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +17: [2023-04-29 11:26:49,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +26: [2023-04-29 11:26:49,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +33: [2023-04-29 11:26:49,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +12: [2023-04-29 11:26:49,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +12: [2023-04-29 11:26:49,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +44: [2023-04-29 11:26:49,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +33: [2023-04-29 11:26:49,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +59: [2023-04-29 11:26:49,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +29: [2023-04-29 11:26:49,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +59: [2023-04-29 11:26:49,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +17: [2023-04-29 11:26:49,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +40: [2023-04-29 11:26:49,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 11:26:49,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +15: [2023-04-29 11:26:49,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +16: [2023-04-29 11:26:49,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +17: [2023-04-29 11:26:49,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +34: [2023-04-29 11:26:49,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +26: [2023-04-29 11:26:49,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +12: [2023-04-29 11:26:49,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +33: [2023-04-29 11:26:49,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +34: [2023-04-29 11:26:49,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +26: [2023-04-29 11:26:49,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +16: [2023-04-29 11:26:49,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +17: [2023-04-29 11:26:49,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +59: [2023-04-29 11:26:49,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +37: [2023-04-29 11:26:49,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +16: [2023-04-29 11:26:49,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +26: [2023-04-29 11:26:49,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +33: [2023-04-29 11:26:49,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +17: [2023-04-29 11:26:49,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +43: [2023-04-29 11:26:49,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +57: [2023-04-29 11:26:49,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +16: [2023-04-29 11:26:49,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +57: [2023-04-29 11:26:49,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +53: [2023-04-29 11:26:49,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +53: [2023-04-29 11:26:49,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +26: [2023-04-29 11:26:49,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +43: [2023-04-29 11:26:49,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +37: [2023-04-29 11:26:49,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +43: [2023-04-29 11:26:49,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +43: [2023-04-29 11:26:49,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +57: [2023-04-29 11:26:49,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +43: [2023-04-29 11:26:49,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +13: [2023-04-29 11:26:49,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +53: [2023-04-29 11:26:49,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +53: [2023-04-29 11:26:49,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +37: [2023-04-29 11:26:49,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +37: [2023-04-29 11:26:49,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +26: [2023-04-29 11:26:49,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +26: [2023-04-29 11:26:49,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +29: [2023-04-29 11:26:49,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +43: [2023-04-29 11:26:49,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +43: [2023-04-29 11:26:49,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +40: [2023-04-29 11:26:49,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +15: [2023-04-29 11:26:49,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +15: [2023-04-29 11:26:49,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +33: [2023-04-29 11:26:49,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +33: [2023-04-29 11:26:49,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +17: [2023-04-29 11:26:49,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +33: [2023-04-29 11:26:49,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +33: [2023-04-29 11:26:49,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +24: [2023-04-29 11:26:49,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +26: [2023-04-29 11:26:49,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +26: [2023-04-29 11:26:49,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +17: [2023-04-29 11:26:49,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 7: [2023-04-29 11:26:49,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +29: [2023-04-29 11:26:49,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +13: [2023-04-29 11:26:49,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +33: [2023-04-29 11:26:49,772] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +24: [2023-04-29 11:26:49,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +33: [2023-04-29 11:26:49,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +11: [2023-04-29 11:26:49,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +11: [2023-04-29 11:26:49,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +11: [2023-04-29 11:26:49,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +13: [2023-04-29 11:26:49,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +52: [2023-04-29 11:26:49,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +13: [2023-04-29 11:26:49,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +11: [2023-04-29 11:26:49,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +33: [2023-04-29 11:26:49,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +33: [2023-04-29 11:26:49,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +26: [2023-04-29 11:26:49,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +34: [2023-04-29 11:26:49,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +24: [2023-04-29 11:26:49,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +34: [2023-04-29 11:26:49,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 11:26:49,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 11:26:49,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 11:26:49,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 11:26:49,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 11:26:49,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 11:26:49,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 11:26:49,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +24: [2023-04-29 11:26:49,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +15: [2023-04-29 11:26:49,779] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +62: [2023-04-29 11:26:49,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +40: [2023-04-29 11:26:49,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +44: [2023-04-29 11:26:49,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +44: [2023-04-29 11:26:49,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +40: [2023-04-29 11:26:49,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +40: [2023-04-29 11:26:49,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +17: [2023-04-29 11:26:49,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +15: [2023-04-29 11:26:49,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +37: [2023-04-29 11:26:49,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +44: [2023-04-29 11:26:49,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +62: [2023-04-29 11:26:49,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 11:26:49,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +26: [2023-04-29 11:26:49,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_00-model_states.pt. +62: [2023-04-29 11:26:49,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 11:26:49,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +38: [2023-04-29 11:26:49,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +38: [2023-04-29 11:26:49,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +62: [2023-04-29 11:26:49,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +38: [2023-04-29 11:26:49,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +38: [2023-04-29 11:26:49,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +26: [2023-04-29 11:26:49,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +62: [2023-04-29 11:26:49,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +62: [2023-04-29 11:26:49,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... + 7: [2023-04-29 11:26:49,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +17: [2023-04-29 11:26:49,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +62: [2023-04-29 11:26:49,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +37: [2023-04-29 11:26:49,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +52: [2023-04-29 11:26:49,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +52: [2023-04-29 11:26:49,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +40: [2023-04-29 11:26:49,790] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +14: [2023-04-29 11:26:49,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 8: [2023-04-29 11:26:49,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +61: [2023-04-29 11:26:49,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 8: [2023-04-29 11:26:49,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 8: [2023-04-29 11:26:49,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +37: [2023-04-29 11:26:49,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +61: [2023-04-29 11:26:49,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +26: [2023-04-29 11:26:49,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt... +37: [2023-04-29 11:26:49,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +52: [2023-04-29 11:26:49,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +61: [2023-04-29 11:26:49,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +61: [2023-04-29 11:26:49,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +14: [2023-04-29 11:26:49,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +41: [2023-04-29 11:26:49,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +41: [2023-04-29 11:26:49,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +11: [2023-04-29 11:26:49,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +41: [2023-04-29 11:26:49,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +52: [2023-04-29 11:26:49,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +41: [2023-04-29 11:26:49,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +47: [2023-04-29 11:26:49,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +47: [2023-04-29 11:26:49,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +47: [2023-04-29 11:26:49,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +47: [2023-04-29 11:26:49,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +47: [2023-04-29 11:26:49,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +47: [2023-04-29 11:26:49,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +47: [2023-04-29 11:26:49,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +47: [2023-04-29 11:26:49,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +40: [2023-04-29 11:26:49,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 7: [2023-04-29 11:26:49,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +12: [2023-04-29 11:26:49,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +23: [2023-04-29 11:26:49,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +23: [2023-04-29 11:26:49,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +40: [2023-04-29 11:26:49,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 6: [2023-04-29 11:26:49,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 6: [2023-04-29 11:26:49,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +47: [2023-04-29 11:26:49,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +47: [2023-04-29 11:26:49,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +47: [2023-04-29 11:26:49,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +47: [2023-04-29 11:26:49,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +38: [2023-04-29 11:26:49,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 7: [2023-04-29 11:26:49,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 5: [2023-04-29 11:26:49,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +14: [2023-04-29 11:26:49,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +11: [2023-04-29 11:26:49,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +33: [2023-04-29 11:26:49,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +12: [2023-04-29 11:26:49,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +38: [2023-04-29 11:26:49,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +52: [2023-04-29 11:26:49,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +38: [2023-04-29 11:26:49,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +38: [2023-04-29 11:26:49,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +47: [2023-04-29 11:26:49,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +14: [2023-04-29 11:26:49,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +52: [2023-04-29 11:26:49,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +47: [2023-04-29 11:26:49,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +14: [2023-04-29 11:26:49,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +14: [2023-04-29 11:26:49,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +42: [2023-04-29 11:26:49,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +42: [2023-04-29 11:26:49,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +42: [2023-04-29 11:26:49,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +42: [2023-04-29 11:26:49,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +42: [2023-04-29 11:26:49,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +42: [2023-04-29 11:26:49,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +42: [2023-04-29 11:26:49,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +14: [2023-04-29 11:26:49,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +42: [2023-04-29 11:26:49,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +47: [2023-04-29 11:26:49,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +23: [2023-04-29 11:26:49,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +23: [2023-04-29 11:26:49,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +11: [2023-04-29 11:26:49,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +47: [2023-04-29 11:26:49,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +14: [2023-04-29 11:26:49,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 6: [2023-04-29 11:26:49,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +16: [2023-04-29 11:26:49,818] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +23: [2023-04-29 11:26:49,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +23: [2023-04-29 11:26:49,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +33: [2023-04-29 11:26:49,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +11: [2023-04-29 11:26:49,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +35: [2023-04-29 11:26:49,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +35: [2023-04-29 11:26:49,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +35: [2023-04-29 11:26:49,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +35: [2023-04-29 11:26:49,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_39-model_01-model_states.pt. +14: [2023-04-29 11:26:49,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +30: [2023-04-29 11:26:49,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +30: [2023-04-29 11:26:49,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +12: [2023-04-29 11:26:49,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +12: [2023-04-29 11:26:49,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +30: [2023-04-29 11:26:49,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +30: [2023-04-29 11:26:49,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +12: [2023-04-29 11:26:49,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +50: [2023-04-29 11:26:49,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +50: [2023-04-29 11:26:49,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +50: [2023-04-29 11:26:49,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +50: [2023-04-29 11:26:49,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +50: [2023-04-29 11:26:49,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +50: [2023-04-29 11:26:49,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +50: [2023-04-29 11:26:49,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +50: [2023-04-29 11:26:49,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +42: [2023-04-29 11:26:49,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +42: [2023-04-29 11:26:49,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +42: [2023-04-29 11:26:49,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +23: [2023-04-29 11:26:49,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +23: [2023-04-29 11:26:49,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +42: [2023-04-29 11:26:49,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... + 5: [2023-04-29 11:26:49,824] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 5: [2023-04-29 11:26:49,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +42: [2023-04-29 11:26:49,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +61: [2023-04-29 11:26:49,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +16: [2023-04-29 11:26:49,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +61: [2023-04-29 11:26:49,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +26: [2023-04-29 11:26:49,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +26: [2023-04-29 11:26:49,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +26: [2023-04-29 11:26:49,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +42: [2023-04-29 11:26:49,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +42: [2023-04-29 11:26:49,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +42: [2023-04-29 11:26:49,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +50: [2023-04-29 11:26:49,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +61: [2023-04-29 11:26:49,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +12: [2023-04-29 11:26:49,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +41: [2023-04-29 11:26:49,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +50: [2023-04-29 11:26:49,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +14: [2023-04-29 11:26:49,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +12: [2023-04-29 11:26:49,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +41: [2023-04-29 11:26:49,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +52: [2023-04-29 11:26:49,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +33: [2023-04-29 11:26:49,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 8: [2023-04-29 11:26:49,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +16: [2023-04-29 11:26:49,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +12: [2023-04-29 11:26:49,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +50: [2023-04-29 11:26:49,829] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... + 8: [2023-04-29 11:26:49,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +50: [2023-04-29 11:26:49,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +50: [2023-04-29 11:26:49,830] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +41: [2023-04-29 11:26:49,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +50: [2023-04-29 11:26:49,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +50: [2023-04-29 11:26:49,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +61: [2023-04-29 11:26:49,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +26: [2023-04-29 11:26:49,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +41: [2023-04-29 11:26:49,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +27: [2023-04-29 11:26:49,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +27: [2023-04-29 11:26:49,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +50: [2023-04-29 11:26:49,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +27: [2023-04-29 11:26:49,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +16: [2023-04-29 11:26:49,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +27: [2023-04-29 11:26:49,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +24: [2023-04-29 11:26:49,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +24: [2023-04-29 11:26:49,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +24: [2023-04-29 11:26:49,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +24: [2023-04-29 11:26:49,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +33: [2023-04-29 11:26:49,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +33: [2023-04-29 11:26:49,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 11:26:49,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +60: [2023-04-29 11:26:49,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +60: [2023-04-29 11:26:49,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. + 5: [2023-04-29 11:26:49,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +16: [2023-04-29 11:26:49,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +39: [2023-04-29 11:26:49,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +39: [2023-04-29 11:26:49,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +51: [2023-04-29 11:26:49,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +51: [2023-04-29 11:26:49,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +51: [2023-04-29 11:26:49,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +51: [2023-04-29 11:26:49,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +51: [2023-04-29 11:26:49,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +51: [2023-04-29 11:26:49,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +51: [2023-04-29 11:26:49,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +51: [2023-04-29 11:26:49,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 11:26:49,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +39: [2023-04-29 11:26:49,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +33: [2023-04-29 11:26:49,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +60: [2023-04-29 11:26:49,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +60: [2023-04-29 11:26:49,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +14: [2023-04-29 11:26:49,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +33: [2023-04-29 11:26:49,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +51: [2023-04-29 11:26:49,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +51: [2023-04-29 11:26:49,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +51: [2023-04-29 11:26:49,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +51: [2023-04-29 11:26:49,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +35: [2023-04-29 11:26:49,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +51: [2023-04-29 11:26:49,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +51: [2023-04-29 11:26:49,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +51: [2023-04-29 11:26:49,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... + 8: [2023-04-29 11:26:49,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +51: [2023-04-29 11:26:49,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 11:26:49,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +35: [2023-04-29 11:26:49,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +35: [2023-04-29 11:26:49,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +30: [2023-04-29 11:26:49,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +30: [2023-04-29 11:26:49,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +30: [2023-04-29 11:26:49,851] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +30: [2023-04-29 11:26:49,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +14: [2023-04-29 11:26:49,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +14: [2023-04-29 11:26:49,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +14: [2023-04-29 11:26:49,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +62: [2023-04-29 11:26:49,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 11:26:49,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +35: [2023-04-29 11:26:49,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 5: [2023-04-29 11:26:49,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +33: [2023-04-29 11:26:49,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +33: [2023-04-29 11:26:49,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... + 9: [2023-04-29 11:26:49,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 9: [2023-04-29 11:26:49,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 9: [2023-04-29 11:26:49,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +26: [2023-04-29 11:26:49,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 9: [2023-04-29 11:26:49,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +26: [2023-04-29 11:26:49,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +14: [2023-04-29 11:26:49,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +14: [2023-04-29 11:26:49,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +26: [2023-04-29 11:26:49,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +24: [2023-04-29 11:26:49,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +16: [2023-04-29 11:26:49,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +33: [2023-04-29 11:26:49,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +33: [2023-04-29 11:26:49,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +27: [2023-04-29 11:26:49,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +27: [2023-04-29 11:26:49,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +16: [2023-04-29 11:26:49,863] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 1: [2023-04-29 11:26:49,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +27: [2023-04-29 11:26:49,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +24: [2023-04-29 11:26:49,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +33: [2023-04-29 11:26:49,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +11: [2023-04-29 11:26:49,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +26: [2023-04-29 11:26:49,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +24: [2023-04-29 11:26:49,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +33: [2023-04-29 11:26:49,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +29: [2023-04-29 11:26:49,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +29: [2023-04-29 11:26:49,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +29: [2023-04-29 11:26:49,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +24: [2023-04-29 11:26:49,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +29: [2023-04-29 11:26:49,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +25: [2023-04-29 11:26:49,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +25: [2023-04-29 11:26:49,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +25: [2023-04-29 11:26:49,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +25: [2023-04-29 11:26:49,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +27: [2023-04-29 11:26:49,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +60: [2023-04-29 11:26:49,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 11:26:49,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +16: [2023-04-29 11:26:49,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 1: [2023-04-29 11:26:49,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +39: [2023-04-29 11:26:49,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +39: [2023-04-29 11:26:49,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +39: [2023-04-29 11:26:49,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +39: [2023-04-29 11:26:49,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +60: [2023-04-29 11:26:49,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +60: [2023-04-29 11:26:49,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +33: [2023-04-29 11:26:49,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +11: [2023-04-29 11:26:49,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +60: [2023-04-29 11:26:49,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +47: [2023-04-29 11:26:49,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +62: [2023-04-29 11:26:49,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 8: [2023-04-29 11:26:49,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 8: [2023-04-29 11:26:49,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 8: [2023-04-29 11:26:49,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +62: [2023-04-29 11:26:49,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +49: [2023-04-29 11:26:49,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +49: [2023-04-29 11:26:49,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +62: [2023-04-29 11:26:49,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +49: [2023-04-29 11:26:49,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +49: [2023-04-29 11:26:49,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. + 8: [2023-04-29 11:26:49,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 8: [2023-04-29 11:26:49,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 8: [2023-04-29 11:26:49,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 9: [2023-04-29 11:26:49,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 9: [2023-04-29 11:26:49,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +42: [2023-04-29 11:26:49,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +58: [2023-04-29 11:26:49,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +58: [2023-04-29 11:26:49,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +58: [2023-04-29 11:26:49,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +58: [2023-04-29 11:26:49,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +47: [2023-04-29 11:26:49,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 9: [2023-04-29 11:26:49,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +47: [2023-04-29 11:26:49,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 9: [2023-04-29 11:26:49,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +10: [2023-04-29 11:26:49,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 11:26:49,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 11:26:49,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 11:26:49,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +25: [2023-04-29 11:26:49,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +47: [2023-04-29 11:26:49,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +50: [2023-04-29 11:26:49,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 1: [2023-04-29 11:26:49,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +11: [2023-04-29 11:26:49,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 11:26:49,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +25: [2023-04-29 11:26:49,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +29: [2023-04-29 11:26:49,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +25: [2023-04-29 11:26:49,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +33: [2023-04-29 11:26:49,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +29: [2023-04-29 11:26:49,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +25: [2023-04-29 11:26:49,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +10: [2023-04-29 11:26:49,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 11:26:49,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 11:26:49,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +47: [2023-04-29 11:26:49,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +42: [2023-04-29 11:26:49,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +42: [2023-04-29 11:26:49,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +42: [2023-04-29 11:26:49,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +10: [2023-04-29 11:26:49,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +32: [2023-04-29 11:26:49,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +32: [2023-04-29 11:26:49,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +33: [2023-04-29 11:26:49,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +29: [2023-04-29 11:26:49,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +14: [2023-04-29 11:26:49,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +29: [2023-04-29 11:26:49,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +32: [2023-04-29 11:26:49,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +32: [2023-04-29 11:26:49,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +11: [2023-04-29 11:26:49,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +50: [2023-04-29 11:26:49,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +14: [2023-04-29 11:26:49,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +49: [2023-04-29 11:26:49,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +49: [2023-04-29 11:26:49,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +49: [2023-04-29 11:26:49,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +28: [2023-04-29 11:26:49,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +28: [2023-04-29 11:26:49,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +28: [2023-04-29 11:26:49,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +11: [2023-04-29 11:26:49,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +28: [2023-04-29 11:26:49,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +11: [2023-04-29 11:26:49,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +49: [2023-04-29 11:26:49,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +30: [2023-04-29 11:26:49,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +50: [2023-04-29 11:26:49,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +50: [2023-04-29 11:26:49,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +58: [2023-04-29 11:26:49,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +51: [2023-04-29 11:26:49,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +58: [2023-04-29 11:26:49,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +58: [2023-04-29 11:26:49,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +58: [2023-04-29 11:26:49,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +42: [2023-04-29 11:26:49,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +30: [2023-04-29 11:26:49,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +11: [2023-04-29 11:26:49,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +47: [2023-04-29 11:26:49,916] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +11: [2023-04-29 11:26:49,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +11: [2023-04-29 11:26:49,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +11: [2023-04-29 11:26:49,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +11: [2023-04-29 11:26:49,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +30: [2023-04-29 11:26:49,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 11:26:49,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +51: [2023-04-29 11:26:49,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +47: [2023-04-29 11:26:49,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +27: [2023-04-29 11:26:49,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +14: [2023-04-29 11:26:49,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 2: [2023-04-29 11:26:49,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 2: [2023-04-29 11:26:49,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 2: [2023-04-29 11:26:49,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 2: [2023-04-29 11:26:49,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +14: [2023-04-29 11:26:49,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +30: [2023-04-29 11:26:49,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +30: [2023-04-29 11:26:49,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +51: [2023-04-29 11:26:49,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +51: [2023-04-29 11:26:49,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +11: [2023-04-29 11:26:49,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 4: [2023-04-29 11:26:49,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 4: [2023-04-29 11:26:49,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +50: [2023-04-29 11:26:49,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +47: [2023-04-29 11:26:49,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +30: [2023-04-29 11:26:49,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 2: [2023-04-29 11:26:49,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +14: [2023-04-29 11:26:49,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +27: [2023-04-29 11:26:49,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +14: [2023-04-29 11:26:49,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +30: [2023-04-29 11:26:49,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 2: [2023-04-29 11:26:49,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 11:26:49,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 11:26:49,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 11:26:49,925] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +31: [2023-04-29 11:26:49,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +31: [2023-04-29 11:26:49,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +31: [2023-04-29 11:26:49,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +30: [2023-04-29 11:26:49,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +31: [2023-04-29 11:26:49,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 2: [2023-04-29 11:26:49,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +36: [2023-04-29 11:26:49,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +36: [2023-04-29 11:26:49,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +27: [2023-04-29 11:26:49,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +24: [2023-04-29 11:26:49,927] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 4: [2023-04-29 11:26:49,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +14: [2023-04-29 11:26:49,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... + 2: [2023-04-29 11:26:49,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +36: [2023-04-29 11:26:49,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +36: [2023-04-29 11:26:49,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +32: [2023-04-29 11:26:49,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +24: [2023-04-29 11:26:49,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +42: [2023-04-29 11:26:49,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +42: [2023-04-29 11:26:49,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +28: [2023-04-29 11:26:49,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +27: [2023-04-29 11:26:49,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +32: [2023-04-29 11:26:49,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +39: [2023-04-29 11:26:49,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +42: [2023-04-29 11:26:49,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +24: [2023-04-29 11:26:49,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +27: [2023-04-29 11:26:49,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +28: [2023-04-29 11:26:49,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +28: [2023-04-29 11:26:49,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +32: [2023-04-29 11:26:49,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +20: [2023-04-29 11:26:49,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +20: [2023-04-29 11:26:49,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +20: [2023-04-29 11:26:49,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +20: [2023-04-29 11:26:49,933] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +50: [2023-04-29 11:26:49,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 4: [2023-04-29 11:26:49,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 4: [2023-04-29 11:26:49,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 4: [2023-04-29 11:26:49,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +27: [2023-04-29 11:26:49,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +24: [2023-04-29 11:26:49,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +39: [2023-04-29 11:26:49,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +28: [2023-04-29 11:26:49,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +32: [2023-04-29 11:26:49,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +27: [2023-04-29 11:26:49,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +15: [2023-04-29 11:26:49,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +15: [2023-04-29 11:26:49,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +15: [2023-04-29 11:26:49,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +15: [2023-04-29 11:26:49,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +51: [2023-04-29 11:26:49,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +39: [2023-04-29 11:26:49,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 11:26:49,940] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +27: [2023-04-29 11:26:49,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +24: [2023-04-29 11:26:49,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 9: [2023-04-29 11:26:49,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 5: [2023-04-29 11:26:49,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 5: [2023-04-29 11:26:49,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 5: [2023-04-29 11:26:49,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +50: [2023-04-29 11:26:49,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +35: [2023-04-29 11:26:49,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +35: [2023-04-29 11:26:49,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +35: [2023-04-29 11:26:49,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +35: [2023-04-29 11:26:49,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +35: [2023-04-29 11:26:49,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +35: [2023-04-29 11:26:49,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +35: [2023-04-29 11:26:49,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +35: [2023-04-29 11:26:49,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +24: [2023-04-29 11:26:49,944] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +50: [2023-04-29 11:26:49,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +39: [2023-04-29 11:26:49,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +39: [2023-04-29 11:26:49,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... + 9: [2023-04-29 11:26:49,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +39: [2023-04-29 11:26:49,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 9: [2023-04-29 11:26:49,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +51: [2023-04-29 11:26:49,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +51: [2023-04-29 11:26:49,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +24: [2023-04-29 11:26:49,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 9: [2023-04-29 11:26:49,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +35: [2023-04-29 11:26:49,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +35: [2023-04-29 11:26:49,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +29: [2023-04-29 11:26:49,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +24: [2023-04-29 11:26:49,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +35: [2023-04-29 11:26:49,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +48: [2023-04-29 11:26:49,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +48: [2023-04-29 11:26:49,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +35: [2023-04-29 11:26:49,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... +35: [2023-04-29 11:26:49,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt... + 9: [2023-04-29 11:26:49,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +51: [2023-04-29 11:26:49,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +31: [2023-04-29 11:26:49,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +36: [2023-04-29 11:26:49,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +35: [2023-04-29 11:26:49,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +35: [2023-04-29 11:26:49,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +48: [2023-04-29 11:26:49,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +48: [2023-04-29 11:26:49,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +31: [2023-04-29 11:26:49,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +35: [2023-04-29 11:26:49,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt... +31: [2023-04-29 11:26:49,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 9: [2023-04-29 11:26:49,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +29: [2023-04-29 11:26:49,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +46: [2023-04-29 11:26:49,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +46: [2023-04-29 11:26:49,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +22: [2023-04-29 11:26:49,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +22: [2023-04-29 11:26:49,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +39: [2023-04-29 11:26:49,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +31: [2023-04-29 11:26:49,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +22: [2023-04-29 11:26:49,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +36: [2023-04-29 11:26:49,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 11:26:49,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +22: [2023-04-29 11:26:49,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +36: [2023-04-29 11:26:49,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +10: [2023-04-29 11:26:49,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 1: [2023-04-29 11:26:49,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +46: [2023-04-29 11:26:49,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +46: [2023-04-29 11:26:49,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +20: [2023-04-29 11:26:49,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +20: [2023-04-29 11:26:49,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 9: [2023-04-29 11:26:49,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +25: [2023-04-29 11:26:49,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +13: [2023-04-29 11:26:49,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +13: [2023-04-29 11:26:49,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +13: [2023-04-29 11:26:49,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +13: [2023-04-29 11:26:49,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 9: [2023-04-29 11:26:49,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +29: [2023-04-29 11:26:49,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 1: [2023-04-29 11:26:49,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +23: [2023-04-29 11:26:49,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +23: [2023-04-29 11:26:49,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +23: [2023-04-29 11:26:49,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +25: [2023-04-29 11:26:49,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +25: [2023-04-29 11:26:49,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 11:26:49,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +20: [2023-04-29 11:26:49,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +25: [2023-04-29 11:26:49,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +20: [2023-04-29 11:26:49,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +25: [2023-04-29 11:26:49,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 4: [2023-04-29 11:26:49,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +15: [2023-04-29 11:26:49,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +63: [2023-04-29 11:26:49,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +63: [2023-04-29 11:26:49,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +63: [2023-04-29 11:26:49,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +63: [2023-04-29 11:26:49,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +23: [2023-04-29 11:26:49,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 1: [2023-04-29 11:26:49,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +29: [2023-04-29 11:26:49,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 4: [2023-04-29 11:26:49,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 1: [2023-04-29 11:26:49,968] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +29: [2023-04-29 11:26:49,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +25: [2023-04-29 11:26:49,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 5: [2023-04-29 11:26:49,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +25: [2023-04-29 11:26:49,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 1: [2023-04-29 11:26:49,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +23: [2023-04-29 11:26:49,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +25: [2023-04-29 11:26:49,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +10: [2023-04-29 11:26:49,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +23: [2023-04-29 11:26:49,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +63: [2023-04-29 11:26:49,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +23: [2023-04-29 11:26:49,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +29: [2023-04-29 11:26:49,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 0: [2023-04-29 11:26:49,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 0: [2023-04-29 11:26:49,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +15: [2023-04-29 11:26:49,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +23: [2023-04-29 11:26:49,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +15: [2023-04-29 11:26:49,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +15: [2023-04-29 11:26:49,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 0: [2023-04-29 11:26:49,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 0: [2023-04-29 11:26:49,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 1: [2023-04-29 11:26:49,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +10: [2023-04-29 11:26:49,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 5: [2023-04-29 11:26:49,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +63: [2023-04-29 11:26:49,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +63: [2023-04-29 11:26:49,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 5: [2023-04-29 11:26:49,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +63: [2023-04-29 11:26:49,975] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +29: [2023-04-29 11:26:49,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +48: [2023-04-29 11:26:49,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +16: [2023-04-29 11:26:49,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +16: [2023-04-29 11:26:49,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +19: [2023-04-29 11:26:49,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +19: [2023-04-29 11:26:49,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 6: [2023-04-29 11:26:49,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +48: [2023-04-29 11:26:49,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +48: [2023-04-29 11:26:49,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +19: [2023-04-29 11:26:49,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +19: [2023-04-29 11:26:49,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +29: [2023-04-29 11:26:49,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +22: [2023-04-29 11:26:49,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +22: [2023-04-29 11:26:49,982] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +43: [2023-04-29 11:26:49,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +43: [2023-04-29 11:26:49,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +43: [2023-04-29 11:26:49,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +43: [2023-04-29 11:26:49,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 11:26:49,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +16: [2023-04-29 11:26:49,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 6: [2023-04-29 11:26:49,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +10: [2023-04-29 11:26:49,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 6: [2023-04-29 11:26:49,983] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +39: [2023-04-29 11:26:49,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +39: [2023-04-29 11:26:49,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +39: [2023-04-29 11:26:49,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +39: [2023-04-29 11:26:49,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +10: [2023-04-29 11:26:49,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +10: [2023-04-29 11:26:49,984] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +19: [2023-04-29 11:26:49,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +10: [2023-04-29 11:26:49,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +46: [2023-04-29 11:26:49,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +19: [2023-04-29 11:26:49,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +19: [2023-04-29 11:26:49,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +16: [2023-04-29 11:26:49,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 6: [2023-04-29 11:26:49,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +10: [2023-04-29 11:26:49,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +46: [2023-04-29 11:26:49,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 6: [2023-04-29 11:26:49,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +19: [2023-04-29 11:26:49,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +46: [2023-04-29 11:26:49,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +46: [2023-04-29 11:26:49,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +22: [2023-04-29 11:26:49,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 2: [2023-04-29 11:26:49,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +43: [2023-04-29 11:26:49,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +43: [2023-04-29 11:26:49,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +58: [2023-04-29 11:26:49,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +58: [2023-04-29 11:26:49,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +58: [2023-04-29 11:26:49,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +43: [2023-04-29 11:26:49,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +43: [2023-04-29 11:26:49,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +58: [2023-04-29 11:26:49,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +58: [2023-04-29 11:26:49,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +58: [2023-04-29 11:26:49,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +58: [2023-04-29 11:26:49,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +11: [2023-04-29 11:26:49,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +22: [2023-04-29 11:26:49,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +39: [2023-04-29 11:26:49,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +58: [2023-04-29 11:26:49,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 11:26:49,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +13: [2023-04-29 11:26:49,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +13: [2023-04-29 11:26:49,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +10: [2023-04-29 11:26:49,989] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +13: [2023-04-29 11:26:49,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +60: [2023-04-29 11:26:49,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +60: [2023-04-29 11:26:49,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +60: [2023-04-29 11:26:49,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +60: [2023-04-29 11:26:49,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +60: [2023-04-29 11:26:49,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +60: [2023-04-29 11:26:49,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +60: [2023-04-29 11:26:49,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +60: [2023-04-29 11:26:49,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 11:26:49,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +39: [2023-04-29 11:26:49,992] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +13: [2023-04-29 11:26:49,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 4: [2023-04-29 11:26:49,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +58: [2023-04-29 11:26:49,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +58: [2023-04-29 11:26:49,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +45: [2023-04-29 11:26:49,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +58: [2023-04-29 11:26:49,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +45: [2023-04-29 11:26:49,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +45: [2023-04-29 11:26:49,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +45: [2023-04-29 11:26:49,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +58: [2023-04-29 11:26:49,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +58: [2023-04-29 11:26:49,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +58: [2023-04-29 11:26:49,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +58: [2023-04-29 11:26:49,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +58: [2023-04-29 11:26:49,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +60: [2023-04-29 11:26:49,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +60: [2023-04-29 11:26:49,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +60: [2023-04-29 11:26:49,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +60: [2023-04-29 11:26:49,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +60: [2023-04-29 11:26:49,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +28: [2023-04-29 11:26:49,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 7: [2023-04-29 11:26:49,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 7: [2023-04-29 11:26:49,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +28: [2023-04-29 11:26:49,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 11:26:49,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +21: [2023-04-29 11:26:49,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 2: [2023-04-29 11:26:50,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +28: [2023-04-29 11:26:50,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +60: [2023-04-29 11:26:50,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 2: [2023-04-29 11:26:50,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +60: [2023-04-29 11:26:50,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... + 7: [2023-04-29 11:26:50,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 7: [2023-04-29 11:26:50,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +21: [2023-04-29 11:26:50,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +11: [2023-04-29 11:26:50,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +11: [2023-04-29 11:26:50,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +11: [2023-04-29 11:26:50,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +60: [2023-04-29 11:26:50,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +21: [2023-04-29 11:26:50,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +28: [2023-04-29 11:26:50,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +28: [2023-04-29 11:26:50,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 0: [2023-04-29 11:26:50,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +35: [2023-04-29 11:26:50,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +28: [2023-04-29 11:26:50,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +16: [2023-04-29 11:26:50,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +11: [2023-04-29 11:26:50,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +16: [2023-04-29 11:26:50,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +10: [2023-04-29 11:26:50,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +10: [2023-04-29 11:26:50,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 2: [2023-04-29 11:26:50,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 2: [2023-04-29 11:26:50,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 2: [2023-04-29 11:26:50,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 2: [2023-04-29 11:26:50,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. + 4: [2023-04-29 11:26:50,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +38: [2023-04-29 11:26:50,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +38: [2023-04-29 11:26:50,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +38: [2023-04-29 11:26:50,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +38: [2023-04-29 11:26:50,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +38: [2023-04-29 11:26:50,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +38: [2023-04-29 11:26:50,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +38: [2023-04-29 11:26:50,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +38: [2023-04-29 11:26:50,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +16: [2023-04-29 11:26:50,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +10: [2023-04-29 11:26:50,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +31: [2023-04-29 11:26:50,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +28: [2023-04-29 11:26:50,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +38: [2023-04-29 11:26:50,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +38: [2023-04-29 11:26:50,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +35: [2023-04-29 11:26:50,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +38: [2023-04-29 11:26:50,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +38: [2023-04-29 11:26:50,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +16: [2023-04-29 11:26:50,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +38: [2023-04-29 11:26:50,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +38: [2023-04-29 11:26:50,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +38: [2023-04-29 11:26:50,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +38: [2023-04-29 11:26:50,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +31: [2023-04-29 11:26:50,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +10: [2023-04-29 11:26:50,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +45: [2023-04-29 11:26:50,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +28: [2023-04-29 11:26:50,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +20: [2023-04-29 11:26:50,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +10: [2023-04-29 11:26:50,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +31: [2023-04-29 11:26:50,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +31: [2023-04-29 11:26:50,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +31: [2023-04-29 11:26:50,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +45: [2023-04-29 11:26:50,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +20: [2023-04-29 11:26:50,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +45: [2023-04-29 11:26:50,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +10: [2023-04-29 11:26:50,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 11:26:50,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +23: [2023-04-29 11:26:50,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +45: [2023-04-29 11:26:50,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +35: [2023-04-29 11:26:50,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +20: [2023-04-29 11:26:50,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 2: [2023-04-29 11:26:50,027] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +21: [2023-04-29 11:26:50,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +31: [2023-04-29 11:26:50,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 2: [2023-04-29 11:26:50,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +31: [2023-04-29 11:26:50,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +31: [2023-04-29 11:26:50,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 5: [2023-04-29 11:26:50,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +35: [2023-04-29 11:26:50,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_00-model_states.pt. +20: [2023-04-29 11:26:50,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +21: [2023-04-29 11:26:50,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +21: [2023-04-29 11:26:50,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +35: [2023-04-29 11:26:50,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +15: [2023-04-29 11:26:50,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 2: [2023-04-29 11:26:50,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +20: [2023-04-29 11:26:50,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 11:26:50,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +23: [2023-04-29 11:26:50,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +11: [2023-04-29 11:26:50,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +34: [2023-04-29 11:26:50,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +11: [2023-04-29 11:26:50,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +34: [2023-04-29 11:26:50,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +34: [2023-04-29 11:26:50,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +59: [2023-04-29 11:26:50,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +59: [2023-04-29 11:26:50,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +11: [2023-04-29 11:26:50,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +34: [2023-04-29 11:26:50,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +15: [2023-04-29 11:26:50,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +43: [2023-04-29 11:26:50,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +43: [2023-04-29 11:26:50,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +20: [2023-04-29 11:26:50,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +43: [2023-04-29 11:26:50,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +59: [2023-04-29 11:26:50,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +43: [2023-04-29 11:26:50,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +59: [2023-04-29 11:26:50,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +20: [2023-04-29 11:26:50,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +19: [2023-04-29 11:26:50,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +63: [2023-04-29 11:26:50,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 3: [2023-04-29 11:26:50,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 5: [2023-04-29 11:26:50,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +20: [2023-04-29 11:26:50,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 2: [2023-04-29 11:26:50,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +15: [2023-04-29 11:26:50,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +15: [2023-04-29 11:26:50,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +15: [2023-04-29 11:26:50,044] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +35: [2023-04-29 11:26:50,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 2: [2023-04-29 11:26:50,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 5: [2023-04-29 11:26:50,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 2: [2023-04-29 11:26:50,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 2: [2023-04-29 11:26:50,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +22: [2023-04-29 11:26:50,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +23: [2023-04-29 11:26:50,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 3: [2023-04-29 11:26:50,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +63: [2023-04-29 11:26:50,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +63: [2023-04-29 11:26:50,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +63: [2023-04-29 11:26:50,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +22: [2023-04-29 11:26:50,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +23: [2023-04-29 11:26:50,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +15: [2023-04-29 11:26:50,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +15: [2023-04-29 11:26:50,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +15: [2023-04-29 11:26:50,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +19: [2023-04-29 11:26:50,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +39: [2023-04-29 11:26:50,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +22: [2023-04-29 11:26:50,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +57: [2023-04-29 11:26:50,052] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +57: [2023-04-29 11:26:50,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +57: [2023-04-29 11:26:50,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +57: [2023-04-29 11:26:50,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +23: [2023-04-29 11:26:50,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +22: [2023-04-29 11:26:50,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 4: [2023-04-29 11:26:50,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +62: [2023-04-29 11:26:50,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +62: [2023-04-29 11:26:50,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +19: [2023-04-29 11:26:50,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +19: [2023-04-29 11:26:50,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 4: [2023-04-29 11:26:50,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +62: [2023-04-29 11:26:50,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +62: [2023-04-29 11:26:50,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. + 3: [2023-04-29 11:26:50,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +60: [2023-04-29 11:26:50,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +39: [2023-04-29 11:26:50,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +43: [2023-04-29 11:26:50,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +43: [2023-04-29 11:26:50,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +22: [2023-04-29 11:26:50,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +35: [2023-04-29 11:26:50,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 6: [2023-04-29 11:26:50,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +23: [2023-04-29 11:26:50,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +60: [2023-04-29 11:26:50,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +58: [2023-04-29 11:26:50,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +22: [2023-04-29 11:26:50,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +34: [2023-04-29 11:26:50,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +34: [2023-04-29 11:26:50,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +13: [2023-04-29 11:26:50,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +13: [2023-04-29 11:26:50,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +13: [2023-04-29 11:26:50,061] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 6: [2023-04-29 11:26:50,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +19: [2023-04-29 11:26:50,062] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +59: [2023-04-29 11:26:50,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +35: [2023-04-29 11:26:50,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +59: [2023-04-29 11:26:50,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +39: [2023-04-29 11:26:50,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +58: [2023-04-29 11:26:50,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +63: [2023-04-29 11:26:50,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +58: [2023-04-29 11:26:50,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +34: [2023-04-29 11:26:50,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +34: [2023-04-29 11:26:50,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +43: [2023-04-29 11:26:50,065] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +13: [2023-04-29 11:26:50,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +22: [2023-04-29 11:26:50,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 7: [2023-04-29 11:26:50,067] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +38: [2023-04-29 11:26:50,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +43: [2023-04-29 11:26:50,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +13: [2023-04-29 11:26:50,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +13: [2023-04-29 11:26:50,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +13: [2023-04-29 11:26:50,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +59: [2023-04-29 11:26:50,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +59: [2023-04-29 11:26:50,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +58: [2023-04-29 11:26:50,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +43: [2023-04-29 11:26:50,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +43: [2023-04-29 11:26:50,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +22: [2023-04-29 11:26:50,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +39: [2023-04-29 11:26:50,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +43: [2023-04-29 11:26:50,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +13: [2023-04-29 11:26:50,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 6: [2023-04-29 11:26:50,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +43: [2023-04-29 11:26:50,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 6: [2023-04-29 11:26:50,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +27: [2023-04-29 11:26:50,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +27: [2023-04-29 11:26:50,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +27: [2023-04-29 11:26:50,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +27: [2023-04-29 11:26:50,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +39: [2023-04-29 11:26:50,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +19: [2023-04-29 11:26:50,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +60: [2023-04-29 11:26:50,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +63: [2023-04-29 11:26:50,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +23: [2023-04-29 11:26:50,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +60: [2023-04-29 11:26:50,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +38: [2023-04-29 11:26:50,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +23: [2023-04-29 11:26:50,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +21: [2023-04-29 11:26:50,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +54: [2023-04-29 11:26:50,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +54: [2023-04-29 11:26:50,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +54: [2023-04-29 11:26:50,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +54: [2023-04-29 11:26:50,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +54: [2023-04-29 11:26:50,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +54: [2023-04-29 11:26:50,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +54: [2023-04-29 11:26:50,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +54: [2023-04-29 11:26:50,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +55: [2023-04-29 11:26:50,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +10: [2023-04-29 11:26:50,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +55: [2023-04-29 11:26:50,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +27: [2023-04-29 11:26:50,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +55: [2023-04-29 11:26:50,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +27: [2023-04-29 11:26:50,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +55: [2023-04-29 11:26:50,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +19: [2023-04-29 11:26:50,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +27: [2023-04-29 11:26:50,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +27: [2023-04-29 11:26:50,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +63: [2023-04-29 11:26:50,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +63: [2023-04-29 11:26:50,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +57: [2023-04-29 11:26:50,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +57: [2023-04-29 11:26:50,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +19: [2023-04-29 11:26:50,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +21: [2023-04-29 11:26:50,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +16: [2023-04-29 11:26:50,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +62: [2023-04-29 11:26:50,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +62: [2023-04-29 11:26:50,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +62: [2023-04-29 11:26:50,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +26: [2023-04-29 11:26:50,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +26: [2023-04-29 11:26:50,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +63: [2023-04-29 11:26:50,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +63: [2023-04-29 11:26:50,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +63: [2023-04-29 11:26:50,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +57: [2023-04-29 11:26:50,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +54: [2023-04-29 11:26:50,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +57: [2023-04-29 11:26:50,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +54: [2023-04-29 11:26:50,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +54: [2023-04-29 11:26:50,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +39: [2023-04-29 11:26:50,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +54: [2023-04-29 11:26:50,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +62: [2023-04-29 11:26:50,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +43: [2023-04-29 11:26:50,085] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +43: [2023-04-29 11:26:50,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +60: [2023-04-29 11:26:50,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +10: [2023-04-29 11:26:50,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +63: [2023-04-29 11:26:50,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +54: [2023-04-29 11:26:50,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +60: [2023-04-29 11:26:50,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +38: [2023-04-29 11:26:50,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +54: [2023-04-29 11:26:50,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... + 7: [2023-04-29 11:26:50,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +26: [2023-04-29 11:26:50,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +26: [2023-04-29 11:26:50,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_17-model_01-model_states.pt. +54: [2023-04-29 11:26:50,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +54: [2023-04-29 11:26:50,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +16: [2023-04-29 11:26:50,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +16: [2023-04-29 11:26:50,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +16: [2023-04-29 11:26:50,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +10: [2023-04-29 11:26:50,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +38: [2023-04-29 11:26:50,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +58: [2023-04-29 11:26:50,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +33: [2023-04-29 11:26:50,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +33: [2023-04-29 11:26:50,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. + 9: [2023-04-29 11:26:50,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 9: [2023-04-29 11:26:50,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 9: [2023-04-29 11:26:50,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +33: [2023-04-29 11:26:50,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +33: [2023-04-29 11:26:50,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +16: [2023-04-29 11:26:50,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +38: [2023-04-29 11:26:50,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 6: [2023-04-29 11:26:50,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +58: [2023-04-29 11:26:50,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +53: [2023-04-29 11:26:50,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +53: [2023-04-29 11:26:50,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +53: [2023-04-29 11:26:50,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. + 9: [2023-04-29 11:26:50,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +10: [2023-04-29 11:26:50,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 11:26:50,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +53: [2023-04-29 11:26:50,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. + 0: [2023-04-29 11:26:50,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +21: [2023-04-29 11:26:50,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +21: [2023-04-29 11:26:50,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +16: [2023-04-29 11:26:50,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +44: [2023-04-29 11:26:50,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +44: [2023-04-29 11:26:50,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +44: [2023-04-29 11:26:50,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +44: [2023-04-29 11:26:50,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +16: [2023-04-29 11:26:50,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 9: [2023-04-29 11:26:50,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +21: [2023-04-29 11:26:50,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +58: [2023-04-29 11:26:50,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +39: [2023-04-29 11:26:50,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +43: [2023-04-29 11:26:50,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +10: [2023-04-29 11:26:50,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +39: [2023-04-29 11:26:50,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +58: [2023-04-29 11:26:50,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +16: [2023-04-29 11:26:50,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +10: [2023-04-29 11:26:50,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... + 0: [2023-04-29 11:26:50,104] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +43: [2023-04-29 11:26:50,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +38: [2023-04-29 11:26:50,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +10: [2023-04-29 11:26:50,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +21: [2023-04-29 11:26:50,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +21: [2023-04-29 11:26:50,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +55: [2023-04-29 11:26:50,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +21: [2023-04-29 11:26:50,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 0: [2023-04-29 11:26:50,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +56: [2023-04-29 11:26:50,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +56: [2023-04-29 11:26:50,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +40: [2023-04-29 11:26:50,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +40: [2023-04-29 11:26:50,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +40: [2023-04-29 11:26:50,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +56: [2023-04-29 11:26:50,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +37: [2023-04-29 11:26:50,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +37: [2023-04-29 11:26:50,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +56: [2023-04-29 11:26:50,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +40: [2023-04-29 11:26:50,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +60: [2023-04-29 11:26:50,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +55: [2023-04-29 11:26:50,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +37: [2023-04-29 11:26:50,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. + 2: [2023-04-29 11:26:50,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +52: [2023-04-29 11:26:50,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +52: [2023-04-29 11:26:50,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +37: [2023-04-29 11:26:50,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +52: [2023-04-29 11:26:50,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +26: [2023-04-29 11:26:50,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +52: [2023-04-29 11:26:50,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. + 1: [2023-04-29 11:26:50,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +60: [2023-04-29 11:26:50,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +55: [2023-04-29 11:26:50,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +55: [2023-04-29 11:26:50,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +26: [2023-04-29 11:26:50,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +56: [2023-04-29 11:26:50,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +56: [2023-04-29 11:26:50,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +56: [2023-04-29 11:26:50,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +26: [2023-04-29 11:26:50,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +56: [2023-04-29 11:26:50,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +33: [2023-04-29 11:26:50,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +38: [2023-04-29 11:26:50,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +63: [2023-04-29 11:26:50,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +63: [2023-04-29 11:26:50,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 2: [2023-04-29 11:26:50,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +32: [2023-04-29 11:26:50,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 11:26:50,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 11:26:50,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +44: [2023-04-29 11:26:50,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +32: [2023-04-29 11:26:50,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 11:26:50,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 11:26:50,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 11:26:50,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 11:26:50,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +38: [2023-04-29 11:26:50,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +56: [2023-04-29 11:26:50,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +56: [2023-04-29 11:26:50,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +63: [2023-04-29 11:26:50,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +63: [2023-04-29 11:26:50,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +53: [2023-04-29 11:26:50,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +53: [2023-04-29 11:26:50,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +53: [2023-04-29 11:26:50,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,124] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +53: [2023-04-29 11:26:50,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +26: [2023-04-29 11:26:50,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt... +56: [2023-04-29 11:26:50,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +44: [2023-04-29 11:26:50,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +44: [2023-04-29 11:26:50,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +44: [2023-04-29 11:26:50,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +32: [2023-04-29 11:26:50,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... + 7: [2023-04-29 11:26:50,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 7: [2023-04-29 11:26:50,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +56: [2023-04-29 11:26:50,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +33: [2023-04-29 11:26:50,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 2: [2023-04-29 11:26:50,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +12: [2023-04-29 11:26:50,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +12: [2023-04-29 11:26:50,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +12: [2023-04-29 11:26:50,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +33: [2023-04-29 11:26:50,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +33: [2023-04-29 11:26:50,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +12: [2023-04-29 11:26:50,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 2: [2023-04-29 11:26:50,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... + 3: [2023-04-29 11:26:50,130] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +36: [2023-04-29 11:26:50,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +36: [2023-04-29 11:26:50,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +36: [2023-04-29 11:26:50,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +36: [2023-04-29 11:26:50,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +36: [2023-04-29 11:26:50,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 11:26:50,132] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +36: [2023-04-29 11:26:50,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +36: [2023-04-29 11:26:50,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +36: [2023-04-29 11:26:50,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 11:26:50,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +43: [2023-04-29 11:26:50,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +32: [2023-04-29 11:26:50,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +19: [2023-04-29 11:26:50,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +19: [2023-04-29 11:26:50,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +32: [2023-04-29 11:26:50,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +19: [2023-04-29 11:26:50,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +19: [2023-04-29 11:26:50,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +32: [2023-04-29 11:26:50,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +32: [2023-04-29 11:26:50,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +32: [2023-04-29 11:26:50,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +52: [2023-04-29 11:26:50,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 11:26:50,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 11:26:50,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +36: [2023-04-29 11:26:50,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +36: [2023-04-29 11:26:50,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +37: [2023-04-29 11:26:50,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +52: [2023-04-29 11:26:50,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +52: [2023-04-29 11:26:50,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +43: [2023-04-29 11:26:50,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +52: [2023-04-29 11:26:50,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +56: [2023-04-29 11:26:50,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 11:26:50,139] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 11:26:50,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +36: [2023-04-29 11:26:50,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +36: [2023-04-29 11:26:50,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +40: [2023-04-29 11:26:50,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +43: [2023-04-29 11:26:50,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +40: [2023-04-29 11:26:50,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +56: [2023-04-29 11:26:50,144] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +40: [2023-04-29 11:26:50,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +40: [2023-04-29 11:26:50,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +37: [2023-04-29 11:26:50,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +54: [2023-04-29 11:26:50,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +37: [2023-04-29 11:26:50,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +27: [2023-04-29 11:26:50,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +18: [2023-04-29 11:26:50,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +18: [2023-04-29 11:26:50,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +18: [2023-04-29 11:26:50,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +51: [2023-04-29 11:26:50,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +51: [2023-04-29 11:26:50,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +51: [2023-04-29 11:26:50,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +18: [2023-04-29 11:26:50,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +43: [2023-04-29 11:26:50,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +51: [2023-04-29 11:26:50,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. + 3: [2023-04-29 11:26:50,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +37: [2023-04-29 11:26:50,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +56: [2023-04-29 11:26:50,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +43: [2023-04-29 11:26:50,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +43: [2023-04-29 11:26:50,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +54: [2023-04-29 11:26:50,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +56: [2023-04-29 11:26:50,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +18: [2023-04-29 11:26:50,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +12: [2023-04-29 11:26:50,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +18: [2023-04-29 11:26:50,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +18: [2023-04-29 11:26:50,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +27: [2023-04-29 11:26:50,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +27: [2023-04-29 11:26:50,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +27: [2023-04-29 11:26:50,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +18: [2023-04-29 11:26:50,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +43: [2023-04-29 11:26:50,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +28: [2023-04-29 11:26:50,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +28: [2023-04-29 11:26:50,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +16: [2023-04-29 11:26:50,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +28: [2023-04-29 11:26:50,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +16: [2023-04-29 11:26:50,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +16: [2023-04-29 11:26:50,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +28: [2023-04-29 11:26:50,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +43: [2023-04-29 11:26:50,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +16: [2023-04-29 11:26:50,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +12: [2023-04-29 11:26:50,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +12: [2023-04-29 11:26:50,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +12: [2023-04-29 11:26:50,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +54: [2023-04-29 11:26:50,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +28: [2023-04-29 11:26:50,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +16: [2023-04-29 11:26:50,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +28: [2023-04-29 11:26:50,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +17: [2023-04-29 11:26:50,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +17: [2023-04-29 11:26:50,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +17: [2023-04-29 11:26:50,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +17: [2023-04-29 11:26:50,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +19: [2023-04-29 11:26:50,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +16: [2023-04-29 11:26:50,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +19: [2023-04-29 11:26:50,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +54: [2023-04-29 11:26:50,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +28: [2023-04-29 11:26:50,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +16: [2023-04-29 11:26:50,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +16: [2023-04-29 11:26:50,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +28: [2023-04-29 11:26:50,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +19: [2023-04-29 11:26:50,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +19: [2023-04-29 11:26:50,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +48: [2023-04-29 11:26:50,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +48: [2023-04-29 11:26:50,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +48: [2023-04-29 11:26:50,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +48: [2023-04-29 11:26:50,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +48: [2023-04-29 11:26:50,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +48: [2023-04-29 11:26:50,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +48: [2023-04-29 11:26:50,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +48: [2023-04-29 11:26:50,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... + 3: [2023-04-29 11:26:50,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +48: [2023-04-29 11:26:50,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +48: [2023-04-29 11:26:50,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +54: [2023-04-29 11:26:50,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +48: [2023-04-29 11:26:50,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +48: [2023-04-29 11:26:50,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +48: [2023-04-29 11:26:50,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +48: [2023-04-29 11:26:50,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +27: [2023-04-29 11:26:50,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +48: [2023-04-29 11:26:50,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +51: [2023-04-29 11:26:50,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +48: [2023-04-29 11:26:50,175] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +39: [2023-04-29 11:26:50,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +39: [2023-04-29 11:26:50,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +39: [2023-04-29 11:26:50,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +39: [2023-04-29 11:26:50,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +26: [2023-04-29 11:26:50,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +51: [2023-04-29 11:26:50,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +51: [2023-04-29 11:26:50,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +51: [2023-04-29 11:26:50,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +54: [2023-04-29 11:26:50,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +30: [2023-04-29 11:26:50,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +30: [2023-04-29 11:26:50,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +30: [2023-04-29 11:26:50,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 9: [2023-04-29 11:26:50,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +30: [2023-04-29 11:26:50,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 9: [2023-04-29 11:26:50,179] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +26: [2023-04-29 11:26:50,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +26: [2023-04-29 11:26:50,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +27: [2023-04-29 11:26:50,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +27: [2023-04-29 11:26:50,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +27: [2023-04-29 11:26:50,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +30: [2023-04-29 11:26:50,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +30: [2023-04-29 11:26:50,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +30: [2023-04-29 11:26:50,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +30: [2023-04-29 11:26:50,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +17: [2023-04-29 11:26:50,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +41: [2023-04-29 11:26:50,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +41: [2023-04-29 11:26:50,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +41: [2023-04-29 11:26:50,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +41: [2023-04-29 11:26:50,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +26: [2023-04-29 11:26:50,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +63: [2023-04-29 11:26:50,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +63: [2023-04-29 11:26:50,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +17: [2023-04-29 11:26:50,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +54: [2023-04-29 11:26:50,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,188] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +17: [2023-04-29 11:26:50,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +54: [2023-04-29 11:26:50,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +17: [2023-04-29 11:26:50,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +61: [2023-04-29 11:26:50,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +61: [2023-04-29 11:26:50,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. + 0: [2023-04-29 11:26:50,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +56: [2023-04-29 11:26:50,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +61: [2023-04-29 11:26:50,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +63: [2023-04-29 11:26:50,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +61: [2023-04-29 11:26:50,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +26: [2023-04-29 11:26:50,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +63: [2023-04-29 11:26:50,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +63: [2023-04-29 11:26:50,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +63: [2023-04-29 11:26:50,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +26: [2023-04-29 11:26:50,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_00-model_states.pt. +56: [2023-04-29 11:26:50,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +36: [2023-04-29 11:26:50,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +63: [2023-04-29 11:26:50,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +49: [2023-04-29 11:26:50,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +49: [2023-04-29 11:26:50,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +49: [2023-04-29 11:26:50,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +49: [2023-04-29 11:26:50,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +49: [2023-04-29 11:26:50,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +49: [2023-04-29 11:26:50,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +49: [2023-04-29 11:26:50,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +49: [2023-04-29 11:26:50,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +63: [2023-04-29 11:26:50,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... + 9: [2023-04-29 11:26:50,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +26: [2023-04-29 11:26:50,201] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +39: [2023-04-29 11:26:50,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +39: [2023-04-29 11:26:50,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +26: [2023-04-29 11:26:50,204] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt... +39: [2023-04-29 11:26:50,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +62: [2023-04-29 11:26:50,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +62: [2023-04-29 11:26:50,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +49: [2023-04-29 11:26:50,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +49: [2023-04-29 11:26:50,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +49: [2023-04-29 11:26:50,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +49: [2023-04-29 11:26:50,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +39: [2023-04-29 11:26:50,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +49: [2023-04-29 11:26:50,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... + 9: [2023-04-29 11:26:50,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +47: [2023-04-29 11:26:50,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +47: [2023-04-29 11:26:50,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +49: [2023-04-29 11:26:50,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 11:26:50,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +62: [2023-04-29 11:26:50,209] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +12: [2023-04-29 11:26:50,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +62: [2023-04-29 11:26:50,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +62: [2023-04-29 11:26:50,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +62: [2023-04-29 11:26:50,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +56: [2023-04-29 11:26:50,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +49: [2023-04-29 11:26:50,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 11:26:50,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +49: [2023-04-29 11:26:50,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +41: [2023-04-29 11:26:50,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 11:26:50,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +47: [2023-04-29 11:26:50,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +36: [2023-04-29 11:26:50,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +36: [2023-04-29 11:26:50,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +36: [2023-04-29 11:26:50,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +18: [2023-04-29 11:26:50,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +47: [2023-04-29 11:26:50,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +62: [2023-04-29 11:26:50,213] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +12: [2023-04-29 11:26:50,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +41: [2023-04-29 11:26:50,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +18: [2023-04-29 11:26:50,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +41: [2023-04-29 11:26:50,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +32: [2023-04-29 11:26:50,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 11:26:50,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 11:26:50,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 11:26:50,214] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 11:26:50,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +56: [2023-04-29 11:26:50,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 11:26:50,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... + 0: [2023-04-29 11:26:50,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +62: [2023-04-29 11:26:50,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +41: [2023-04-29 11:26:50,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +62: [2023-04-29 11:26:50,217] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +62: [2023-04-29 11:26:50,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +62: [2023-04-29 11:26:50,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +61: [2023-04-29 11:26:50,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +18: [2023-04-29 11:26:50,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +56: [2023-04-29 11:26:50,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +56: [2023-04-29 11:26:50,220] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +59: [2023-04-29 11:26:50,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +59: [2023-04-29 11:26:50,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +59: [2023-04-29 11:26:50,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +59: [2023-04-29 11:26:50,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +59: [2023-04-29 11:26:50,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +59: [2023-04-29 11:26:50,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +59: [2023-04-29 11:26:50,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +59: [2023-04-29 11:26:50,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,222] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +12: [2023-04-29 11:26:50,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +18: [2023-04-29 11:26:50,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +12: [2023-04-29 11:26:50,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +16: [2023-04-29 11:26:50,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +19: [2023-04-29 11:26:50,222] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +61: [2023-04-29 11:26:50,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +61: [2023-04-29 11:26:50,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +61: [2023-04-29 11:26:50,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +59: [2023-04-29 11:26:50,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +12: [2023-04-29 11:26:50,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +36: [2023-04-29 11:26:50,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +28: [2023-04-29 11:26:50,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +19: [2023-04-29 11:26:50,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +59: [2023-04-29 11:26:50,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +59: [2023-04-29 11:26:50,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +56: [2023-04-29 11:26:50,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +12: [2023-04-29 11:26:50,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +12: [2023-04-29 11:26:50,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +59: [2023-04-29 11:26:50,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +12: [2023-04-29 11:26:50,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +19: [2023-04-29 11:26:50,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +48: [2023-04-29 11:26:50,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +19: [2023-04-29 11:26:50,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +19: [2023-04-29 11:26:50,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +56: [2023-04-29 11:26:50,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +56: [2023-04-29 11:26:50,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +16: [2023-04-29 11:26:50,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +59: [2023-04-29 11:26:50,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +19: [2023-04-29 11:26:50,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +59: [2023-04-29 11:26:50,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +28: [2023-04-29 11:26:50,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +59: [2023-04-29 11:26:50,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +42: [2023-04-29 11:26:50,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +42: [2023-04-29 11:26:50,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +42: [2023-04-29 11:26:50,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +59: [2023-04-29 11:26:50,233] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +42: [2023-04-29 11:26:50,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +56: [2023-04-29 11:26:50,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +16: [2023-04-29 11:26:50,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +16: [2023-04-29 11:26:50,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +56: [2023-04-29 11:26:50,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +47: [2023-04-29 11:26:50,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +47: [2023-04-29 11:26:50,235] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +28: [2023-04-29 11:26:50,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +28: [2023-04-29 11:26:50,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +33: [2023-04-29 11:26:50,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +33: [2023-04-29 11:26:50,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +33: [2023-04-29 11:26:50,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +33: [2023-04-29 11:26:50,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +33: [2023-04-29 11:26:50,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +33: [2023-04-29 11:26:50,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +33: [2023-04-29 11:26:50,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +19: [2023-04-29 11:26:50,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +33: [2023-04-29 11:26:50,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +19: [2023-04-29 11:26:50,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +18: [2023-04-29 11:26:50,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +56: [2023-04-29 11:26:50,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +33: [2023-04-29 11:26:50,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +47: [2023-04-29 11:26:50,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +45: [2023-04-29 11:26:50,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +45: [2023-04-29 11:26:50,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +45: [2023-04-29 11:26:50,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +45: [2023-04-29 11:26:50,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +45: [2023-04-29 11:26:50,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +45: [2023-04-29 11:26:50,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +45: [2023-04-29 11:26:50,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +45: [2023-04-29 11:26:50,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +50: [2023-04-29 11:26:50,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +50: [2023-04-29 11:26:50,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +50: [2023-04-29 11:26:50,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +50: [2023-04-29 11:26:50,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +33: [2023-04-29 11:26:50,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +56: [2023-04-29 11:26:50,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +33: [2023-04-29 11:26:50,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +40: [2023-04-29 11:26:50,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +40: [2023-04-29 11:26:50,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +40: [2023-04-29 11:26:50,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +40: [2023-04-29 11:26:50,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +40: [2023-04-29 11:26:50,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +40: [2023-04-29 11:26:50,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +40: [2023-04-29 11:26:50,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +40: [2023-04-29 11:26:50,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +56: [2023-04-29 11:26:50,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +33: [2023-04-29 11:26:50,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +36: [2023-04-29 11:26:50,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +18: [2023-04-29 11:26:50,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +36: [2023-04-29 11:26:50,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +45: [2023-04-29 11:26:50,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +56: [2023-04-29 11:26:50,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +36: [2023-04-29 11:26:50,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +16: [2023-04-29 11:26:50,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +45: [2023-04-29 11:26:50,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +47: [2023-04-29 11:26:50,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +33: [2023-04-29 11:26:50,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +33: [2023-04-29 11:26:50,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +45: [2023-04-29 11:26:50,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +45: [2023-04-29 11:26:50,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +33: [2023-04-29 11:26:50,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +17: [2023-04-29 11:26:50,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +45: [2023-04-29 11:26:50,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +33: [2023-04-29 11:26:50,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +40: [2023-04-29 11:26:50,246] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +56: [2023-04-29 11:26:50,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +48: [2023-04-29 11:26:50,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +45: [2023-04-29 11:26:50,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +40: [2023-04-29 11:26:50,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +18: [2023-04-29 11:26:50,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +40: [2023-04-29 11:26:50,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +40: [2023-04-29 11:26:50,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +40: [2023-04-29 11:26:50,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +18: [2023-04-29 11:26:50,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +30: [2023-04-29 11:26:50,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +45: [2023-04-29 11:26:50,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +45: [2023-04-29 11:26:50,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +40: [2023-04-29 11:26:50,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +48: [2023-04-29 11:26:50,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +48: [2023-04-29 11:26:50,249] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +40: [2023-04-29 11:26:50,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +17: [2023-04-29 11:26:50,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +40: [2023-04-29 11:26:50,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +28: [2023-04-29 11:26:50,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +30: [2023-04-29 11:26:50,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +30: [2023-04-29 11:26:50,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +30: [2023-04-29 11:26:50,254] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +32: [2023-04-29 11:26:50,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +32: [2023-04-29 11:26:50,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +32: [2023-04-29 11:26:50,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +32: [2023-04-29 11:26:50,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +17: [2023-04-29 11:26:50,255] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +48: [2023-04-29 11:26:50,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +28: [2023-04-29 11:26:50,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +25: [2023-04-29 11:26:50,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +25: [2023-04-29 11:26:50,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +17: [2023-04-29 11:26:50,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +25: [2023-04-29 11:26:50,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +25: [2023-04-29 11:26:50,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +17: [2023-04-29 11:26:50,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +42: [2023-04-29 11:26:50,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +17: [2023-04-29 11:26:50,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +42: [2023-04-29 11:26:50,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +42: [2023-04-29 11:26:50,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +42: [2023-04-29 11:26:50,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +25: [2023-04-29 11:26:50,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +16: [2023-04-29 11:26:50,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +25: [2023-04-29 11:26:50,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +16: [2023-04-29 11:26:50,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +17: [2023-04-29 11:26:50,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +17: [2023-04-29 11:26:50,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +25: [2023-04-29 11:26:50,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +16: [2023-04-29 11:26:50,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +25: [2023-04-29 11:26:50,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +35: [2023-04-29 11:26:50,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +35: [2023-04-29 11:26:50,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +35: [2023-04-29 11:26:50,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. + 4: [2023-04-29 11:26:50,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +35: [2023-04-29 11:26:50,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_40-model_01-model_states.pt. +28: [2023-04-29 11:26:50,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +50: [2023-04-29 11:26:50,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +50: [2023-04-29 11:26:50,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +39: [2023-04-29 11:26:50,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +39: [2023-04-29 11:26:50,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +50: [2023-04-29 11:26:50,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +50: [2023-04-29 11:26:50,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +49: [2023-04-29 11:26:50,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +28: [2023-04-29 11:26:50,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +18: [2023-04-29 11:26:50,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +18: [2023-04-29 11:26:50,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +18: [2023-04-29 11:26:50,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +18: [2023-04-29 11:26:50,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +30: [2023-04-29 11:26:50,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +39: [2023-04-29 11:26:50,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +39: [2023-04-29 11:26:50,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +39: [2023-04-29 11:26:50,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +49: [2023-04-29 11:26:50,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +48: [2023-04-29 11:26:50,280] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +55: [2023-04-29 11:26:50,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +55: [2023-04-29 11:26:50,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +55: [2023-04-29 11:26:50,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +55: [2023-04-29 11:26:50,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +55: [2023-04-29 11:26:50,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 11:26:50,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +62: [2023-04-29 11:26:50,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +55: [2023-04-29 11:26:50,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +55: [2023-04-29 11:26:50,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +55: [2023-04-29 11:26:50,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +49: [2023-04-29 11:26:50,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +49: [2023-04-29 11:26:50,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 11:26:50,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +30: [2023-04-29 11:26:50,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +48: [2023-04-29 11:26:50,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 6: [2023-04-29 11:26:50,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 6: [2023-04-29 11:26:50,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 6: [2023-04-29 11:26:50,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +48: [2023-04-29 11:26:50,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 6: [2023-04-29 11:26:50,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +30: [2023-04-29 11:26:50,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 11:26:50,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +30: [2023-04-29 11:26:50,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 11:26:50,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +11: [2023-04-29 11:26:50,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +62: [2023-04-29 11:26:50,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +55: [2023-04-29 11:26:50,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +11: [2023-04-29 11:26:50,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 6: [2023-04-29 11:26:50,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +55: [2023-04-29 11:26:50,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... + 6: [2023-04-29 11:26:50,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +39: [2023-04-29 11:26:50,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... + 6: [2023-04-29 11:26:50,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +55: [2023-04-29 11:26:50,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +62: [2023-04-29 11:26:50,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +39: [2023-04-29 11:26:50,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +33: [2023-04-29 11:26:50,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +55: [2023-04-29 11:26:50,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +55: [2023-04-29 11:26:50,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +55: [2023-04-29 11:26:50,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +55: [2023-04-29 11:26:50,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +55: [2023-04-29 11:26:50,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 1: [2023-04-29 11:26:50,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 1: [2023-04-29 11:26:50,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 1: [2023-04-29 11:26:50,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +59: [2023-04-29 11:26:50,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +14: [2023-04-29 11:26:50,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +14: [2023-04-29 11:26:50,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +14: [2023-04-29 11:26:50,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +14: [2023-04-29 11:26:50,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +49: [2023-04-29 11:26:50,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +45: [2023-04-29 11:26:50,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +23: [2023-04-29 11:26:50,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +23: [2023-04-29 11:26:50,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +23: [2023-04-29 11:26:50,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +35: [2023-04-29 11:26:50,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +35: [2023-04-29 11:26:50,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +23: [2023-04-29 11:26:50,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +18: [2023-04-29 11:26:50,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +33: [2023-04-29 11:26:50,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +33: [2023-04-29 11:26:50,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +35: [2023-04-29 11:26:50,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +35: [2023-04-29 11:26:50,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +13: [2023-04-29 11:26:50,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +13: [2023-04-29 11:26:50,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +18: [2023-04-29 11:26:50,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +18: [2023-04-29 11:26:50,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +45: [2023-04-29 11:26:50,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +18: [2023-04-29 11:26:50,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +24: [2023-04-29 11:26:50,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +24: [2023-04-29 11:26:50,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +24: [2023-04-29 11:26:50,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +24: [2023-04-29 11:26:50,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +11: [2023-04-29 11:26:50,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 11:26:50,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +13: [2023-04-29 11:26:50,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +62: [2023-04-29 11:26:50,308] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +40: [2023-04-29 11:26:50,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +33: [2023-04-29 11:26:50,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +62: [2023-04-29 11:26:50,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +59: [2023-04-29 11:26:50,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +22: [2023-04-29 11:26:50,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +22: [2023-04-29 11:26:50,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +49: [2023-04-29 11:26:50,310] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +59: [2023-04-29 11:26:50,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +13: [2023-04-29 11:26:50,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +24: [2023-04-29 11:26:50,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +45: [2023-04-29 11:26:50,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +24: [2023-04-29 11:26:50,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +24: [2023-04-29 11:26:50,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +13: [2023-04-29 11:26:50,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +22: [2023-04-29 11:26:50,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +24: [2023-04-29 11:26:50,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +22: [2023-04-29 11:26:50,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +49: [2023-04-29 11:26:50,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +49: [2023-04-29 11:26:50,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +59: [2023-04-29 11:26:50,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +62: [2023-04-29 11:26:50,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 6: [2023-04-29 11:26:50,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +62: [2023-04-29 11:26:50,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +13: [2023-04-29 11:26:50,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +13: [2023-04-29 11:26:50,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +34: [2023-04-29 11:26:50,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +34: [2023-04-29 11:26:50,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 6: [2023-04-29 11:26:50,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +51: [2023-04-29 11:26:50,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +51: [2023-04-29 11:26:50,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +51: [2023-04-29 11:26:50,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +51: [2023-04-29 11:26:50,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +51: [2023-04-29 11:26:50,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +51: [2023-04-29 11:26:50,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +51: [2023-04-29 11:26:50,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +51: [2023-04-29 11:26:50,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +34: [2023-04-29 11:26:50,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +34: [2023-04-29 11:26:50,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +34: [2023-04-29 11:26:50,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +34: [2023-04-29 11:26:50,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +34: [2023-04-29 11:26:50,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +34: [2023-04-29 11:26:50,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +22: [2023-04-29 11:26:50,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +22: [2023-04-29 11:26:50,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +22: [2023-04-29 11:26:50,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +51: [2023-04-29 11:26:50,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +25: [2023-04-29 11:26:50,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +34: [2023-04-29 11:26:50,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +40: [2023-04-29 11:26:50,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +11: [2023-04-29 11:26:50,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +40: [2023-04-29 11:26:50,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +34: [2023-04-29 11:26:50,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +14: [2023-04-29 11:26:50,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +51: [2023-04-29 11:26:50,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +51: [2023-04-29 11:26:50,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +22: [2023-04-29 11:26:50,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +34: [2023-04-29 11:26:50,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +51: [2023-04-29 11:26:50,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +40: [2023-04-29 11:26:50,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +51: [2023-04-29 11:26:50,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +51: [2023-04-29 11:26:50,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... + 1: [2023-04-29 11:26:50,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +51: [2023-04-29 11:26:50,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +45: [2023-04-29 11:26:50,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +51: [2023-04-29 11:26:50,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +14: [2023-04-29 11:26:50,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +14: [2023-04-29 11:26:50,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +11: [2023-04-29 11:26:50,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +11: [2023-04-29 11:26:50,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +33: [2023-04-29 11:26:50,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,323] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +59: [2023-04-29 11:26:50,324] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +29: [2023-04-29 11:26:50,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +29: [2023-04-29 11:26:50,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +29: [2023-04-29 11:26:50,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +23: [2023-04-29 11:26:50,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +23: [2023-04-29 11:26:50,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +23: [2023-04-29 11:26:50,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +29: [2023-04-29 11:26:50,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +34: [2023-04-29 11:26:50,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +45: [2023-04-29 11:26:50,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +14: [2023-04-29 11:26:50,325] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +46: [2023-04-29 11:26:50,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +46: [2023-04-29 11:26:50,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +46: [2023-04-29 11:26:50,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +46: [2023-04-29 11:26:50,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +46: [2023-04-29 11:26:50,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +46: [2023-04-29 11:26:50,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +46: [2023-04-29 11:26:50,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +25: [2023-04-29 11:26:50,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +46: [2023-04-29 11:26:50,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +34: [2023-04-29 11:26:50,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +23: [2023-04-29 11:26:50,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +34: [2023-04-29 11:26:50,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +34: [2023-04-29 11:26:50,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +34: [2023-04-29 11:26:50,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +29: [2023-04-29 11:26:50,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +29: [2023-04-29 11:26:50,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +29: [2023-04-29 11:26:50,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +46: [2023-04-29 11:26:50,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +33: [2023-04-29 11:26:50,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +23: [2023-04-29 11:26:50,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +23: [2023-04-29 11:26:50,330] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +46: [2023-04-29 11:26:50,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +46: [2023-04-29 11:26:50,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +46: [2023-04-29 11:26:50,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +40: [2023-04-29 11:26:50,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +23: [2023-04-29 11:26:50,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +23: [2023-04-29 11:26:50,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +23: [2023-04-29 11:26:50,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +29: [2023-04-29 11:26:50,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +23: [2023-04-29 11:26:50,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +23: [2023-04-29 11:26:50,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +46: [2023-04-29 11:26:50,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +46: [2023-04-29 11:26:50,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +25: [2023-04-29 11:26:50,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +46: [2023-04-29 11:26:50,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +45: [2023-04-29 11:26:50,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +46: [2023-04-29 11:26:50,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +37: [2023-04-29 11:26:50,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +37: [2023-04-29 11:26:50,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +37: [2023-04-29 11:26:50,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +37: [2023-04-29 11:26:50,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +37: [2023-04-29 11:26:50,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +37: [2023-04-29 11:26:50,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +37: [2023-04-29 11:26:50,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +37: [2023-04-29 11:26:50,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,335] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +33: [2023-04-29 11:26:50,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +23: [2023-04-29 11:26:50,335] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +25: [2023-04-29 11:26:50,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +45: [2023-04-29 11:26:50,337] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +37: [2023-04-29 11:26:50,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +37: [2023-04-29 11:26:50,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +37: [2023-04-29 11:26:50,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +31: [2023-04-29 11:26:50,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +31: [2023-04-29 11:26:50,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +31: [2023-04-29 11:26:50,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +31: [2023-04-29 11:26:50,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +21: [2023-04-29 11:26:50,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +21: [2023-04-29 11:26:50,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +20: [2023-04-29 11:26:50,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +20: [2023-04-29 11:26:50,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +59: [2023-04-29 11:26:50,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +47: [2023-04-29 11:26:50,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +47: [2023-04-29 11:26:50,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +37: [2023-04-29 11:26:50,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +20: [2023-04-29 11:26:50,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +37: [2023-04-29 11:26:50,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +37: [2023-04-29 11:26:50,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +21: [2023-04-29 11:26:50,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +20: [2023-04-29 11:26:50,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +37: [2023-04-29 11:26:50,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +37: [2023-04-29 11:26:50,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +21: [2023-04-29 11:26:50,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +21: [2023-04-29 11:26:50,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +31: [2023-04-29 11:26:50,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +59: [2023-04-29 11:26:50,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +31: [2023-04-29 11:26:50,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +31: [2023-04-29 11:26:50,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +47: [2023-04-29 11:26:50,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +47: [2023-04-29 11:26:50,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +47: [2023-04-29 11:26:50,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +47: [2023-04-29 11:26:50,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +47: [2023-04-29 11:26:50,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +31: [2023-04-29 11:26:50,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +47: [2023-04-29 11:26:50,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +21: [2023-04-29 11:26:50,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +38: [2023-04-29 11:26:50,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +38: [2023-04-29 11:26:50,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +38: [2023-04-29 11:26:50,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +38: [2023-04-29 11:26:50,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +55: [2023-04-29 11:26:50,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +47: [2023-04-29 11:26:50,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +40: [2023-04-29 11:26:50,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +20: [2023-04-29 11:26:50,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +20: [2023-04-29 11:26:50,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +25: [2023-04-29 11:26:50,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +47: [2023-04-29 11:26:50,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +15: [2023-04-29 11:26:50,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +15: [2023-04-29 11:26:50,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +15: [2023-04-29 11:26:50,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +15: [2023-04-29 11:26:50,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +20: [2023-04-29 11:26:50,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +21: [2023-04-29 11:26:50,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +20: [2023-04-29 11:26:50,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +21: [2023-04-29 11:26:50,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +40: [2023-04-29 11:26:50,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +40: [2023-04-29 11:26:50,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +33: [2023-04-29 11:26:50,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +47: [2023-04-29 11:26:50,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +59: [2023-04-29 11:26:50,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +47: [2023-04-29 11:26:50,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +47: [2023-04-29 11:26:50,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +25: [2023-04-29 11:26:50,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +47: [2023-04-29 11:26:50,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +15: [2023-04-29 11:26:50,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +15: [2023-04-29 11:26:50,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +15: [2023-04-29 11:26:50,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +15: [2023-04-29 11:26:50,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +47: [2023-04-29 11:26:50,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +11: [2023-04-29 11:26:50,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +55: [2023-04-29 11:26:50,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +47: [2023-04-29 11:26:50,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +11: [2023-04-29 11:26:50,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +11: [2023-04-29 11:26:50,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +11: [2023-04-29 11:26:50,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +45: [2023-04-29 11:26:50,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +25: [2023-04-29 11:26:50,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 11:26:50,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +15: [2023-04-29 11:26:50,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +15: [2023-04-29 11:26:50,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +15: [2023-04-29 11:26:50,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +15: [2023-04-29 11:26:50,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +54: [2023-04-29 11:26:50,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +54: [2023-04-29 11:26:50,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +54: [2023-04-29 11:26:50,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +54: [2023-04-29 11:26:50,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +18: [2023-04-29 11:26:50,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +55: [2023-04-29 11:26:50,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +55: [2023-04-29 11:26:50,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +11: [2023-04-29 11:26:50,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +25: [2023-04-29 11:26:50,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +57: [2023-04-29 11:26:50,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +57: [2023-04-29 11:26:50,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +11: [2023-04-29 11:26:50,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +57: [2023-04-29 11:26:50,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +57: [2023-04-29 11:26:50,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +57: [2023-04-29 11:26:50,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +57: [2023-04-29 11:26:50,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +57: [2023-04-29 11:26:50,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +57: [2023-04-29 11:26:50,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +11: [2023-04-29 11:26:50,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +12: [2023-04-29 11:26:50,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +12: [2023-04-29 11:26:50,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +12: [2023-04-29 11:26:50,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +12: [2023-04-29 11:26:50,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 0: [2023-04-29 11:26:50,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 0: [2023-04-29 11:26:50,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 0: [2023-04-29 11:26:50,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +18: [2023-04-29 11:26:50,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... + 4: [2023-04-29 11:26:50,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +57: [2023-04-29 11:26:50,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +57: [2023-04-29 11:26:50,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +41: [2023-04-29 11:26:50,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +41: [2023-04-29 11:26:50,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +41: [2023-04-29 11:26:50,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +41: [2023-04-29 11:26:50,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +41: [2023-04-29 11:26:50,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +41: [2023-04-29 11:26:50,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +41: [2023-04-29 11:26:50,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +57: [2023-04-29 11:26:50,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +41: [2023-04-29 11:26:50,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +57: [2023-04-29 11:26:50,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +57: [2023-04-29 11:26:50,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +57: [2023-04-29 11:26:50,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +12: [2023-04-29 11:26:50,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +12: [2023-04-29 11:26:50,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +18: [2023-04-29 11:26:50,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +57: [2023-04-29 11:26:50,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +57: [2023-04-29 11:26:50,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +12: [2023-04-29 11:26:50,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +24: [2023-04-29 11:26:50,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +12: [2023-04-29 11:26:50,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +55: [2023-04-29 11:26:50,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +29: [2023-04-29 11:26:50,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +29: [2023-04-29 11:26:50,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +29: [2023-04-29 11:26:50,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +29: [2023-04-29 11:26:50,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 8: [2023-04-29 11:26:50,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 8: [2023-04-29 11:26:50,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 8: [2023-04-29 11:26:50,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +11: [2023-04-29 11:26:50,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +38: [2023-04-29 11:26:50,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 2: [2023-04-29 11:26:50,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +38: [2023-04-29 11:26:50,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +41: [2023-04-29 11:26:50,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +15: [2023-04-29 11:26:50,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 2: [2023-04-29 11:26:50,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +18: [2023-04-29 11:26:50,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +38: [2023-04-29 11:26:50,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +38: [2023-04-29 11:26:50,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +41: [2023-04-29 11:26:50,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +41: [2023-04-29 11:26:50,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +24: [2023-04-29 11:26:50,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +24: [2023-04-29 11:26:50,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +61: [2023-04-29 11:26:50,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +61: [2023-04-29 11:26:50,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +61: [2023-04-29 11:26:50,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +61: [2023-04-29 11:26:50,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +61: [2023-04-29 11:26:50,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +61: [2023-04-29 11:26:50,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +61: [2023-04-29 11:26:50,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +41: [2023-04-29 11:26:50,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +41: [2023-04-29 11:26:50,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +50: [2023-04-29 11:26:50,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +50: [2023-04-29 11:26:50,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +61: [2023-04-29 11:26:50,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +38: [2023-04-29 11:26:50,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +18: [2023-04-29 11:26:50,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +38: [2023-04-29 11:26:50,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +38: [2023-04-29 11:26:50,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +51: [2023-04-29 11:26:50,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +41: [2023-04-29 11:26:50,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +11: [2023-04-29 11:26:50,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +38: [2023-04-29 11:26:50,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +18: [2023-04-29 11:26:50,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +38: [2023-04-29 11:26:50,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +41: [2023-04-29 11:26:50,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +41: [2023-04-29 11:26:50,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... + 6: [2023-04-29 11:26:50,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +13: [2023-04-29 11:26:50,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +13: [2023-04-29 11:26:50,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +13: [2023-04-29 11:26:50,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +25: [2023-04-29 11:26:50,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +50: [2023-04-29 11:26:50,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +25: [2023-04-29 11:26:50,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +25: [2023-04-29 11:26:50,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +27: [2023-04-29 11:26:50,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +27: [2023-04-29 11:26:50,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +50: [2023-04-29 11:26:50,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +50: [2023-04-29 11:26:50,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +50: [2023-04-29 11:26:50,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +25: [2023-04-29 11:26:50,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +50: [2023-04-29 11:26:50,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +27: [2023-04-29 11:26:50,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +50: [2023-04-29 11:26:50,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +28: [2023-04-29 11:26:50,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +28: [2023-04-29 11:26:50,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 2: [2023-04-29 11:26:50,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +38: [2023-04-29 11:26:50,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +24: [2023-04-29 11:26:50,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +61: [2023-04-29 11:26:50,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +24: [2023-04-29 11:26:50,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +31: [2023-04-29 11:26:50,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +31: [2023-04-29 11:26:50,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +31: [2023-04-29 11:26:50,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +31: [2023-04-29 11:26:50,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +18: [2023-04-29 11:26:50,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +27: [2023-04-29 11:26:50,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +24: [2023-04-29 11:26:50,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +24: [2023-04-29 11:26:50,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +61: [2023-04-29 11:26:50,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +61: [2023-04-29 11:26:50,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +24: [2023-04-29 11:26:50,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +46: [2023-04-29 11:26:50,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +13: [2023-04-29 11:26:50,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +55: [2023-04-29 11:26:50,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +30: [2023-04-29 11:26:50,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +30: [2023-04-29 11:26:50,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +61: [2023-04-29 11:26:50,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +30: [2023-04-29 11:26:50,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +34: [2023-04-29 11:26:50,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +38: [2023-04-29 11:26:50,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +15: [2023-04-29 11:26:50,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +30: [2023-04-29 11:26:50,384] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +38: [2023-04-29 11:26:50,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +61: [2023-04-29 11:26:50,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +15: [2023-04-29 11:26:50,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +15: [2023-04-29 11:26:50,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +61: [2023-04-29 11:26:50,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +61: [2023-04-29 11:26:50,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +61: [2023-04-29 11:26:50,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +17: [2023-04-29 11:26:50,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +50: [2023-04-29 11:26:50,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +17: [2023-04-29 11:26:50,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +28: [2023-04-29 11:26:50,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +17: [2023-04-29 11:26:50,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +28: [2023-04-29 11:26:50,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +17: [2023-04-29 11:26:50,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +18: [2023-04-29 11:26:50,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +50: [2023-04-29 11:26:50,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +34: [2023-04-29 11:26:50,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +22: [2023-04-29 11:26:50,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +22: [2023-04-29 11:26:50,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +50: [2023-04-29 11:26:50,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +50: [2023-04-29 11:26:50,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +50: [2023-04-29 11:26:50,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +23: [2023-04-29 11:26:50,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +50: [2023-04-29 11:26:50,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +60: [2023-04-29 11:26:50,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +60: [2023-04-29 11:26:50,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +60: [2023-04-29 11:26:50,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +60: [2023-04-29 11:26:50,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +22: [2023-04-29 11:26:50,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +51: [2023-04-29 11:26:50,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +50: [2023-04-29 11:26:50,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +22: [2023-04-29 11:26:50,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +50: [2023-04-29 11:26:50,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +17: [2023-04-29 11:26:50,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 9: [2023-04-29 11:26:50,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +17: [2023-04-29 11:26:50,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +10: [2023-04-29 11:26:50,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +10: [2023-04-29 11:26:50,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +10: [2023-04-29 11:26:50,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 5: [2023-04-29 11:26:50,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +10: [2023-04-29 11:26:50,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 9: [2023-04-29 11:26:50,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... + 9: [2023-04-29 11:26:50,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +17: [2023-04-29 11:26:50,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +55: [2023-04-29 11:26:50,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +55: [2023-04-29 11:26:50,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +54: [2023-04-29 11:26:50,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +54: [2023-04-29 11:26:50,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 5: [2023-04-29 11:26:50,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +17: [2023-04-29 11:26:50,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +60: [2023-04-29 11:26:50,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +60: [2023-04-29 11:26:50,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +51: [2023-04-29 11:26:50,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +54: [2023-04-29 11:26:50,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +54: [2023-04-29 11:26:50,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +46: [2023-04-29 11:26:50,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 9: [2023-04-29 11:26:50,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +23: [2023-04-29 11:26:50,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +23: [2023-04-29 11:26:50,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +13: [2023-04-29 11:26:50,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +13: [2023-04-29 11:26:50,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +58: [2023-04-29 11:26:50,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +58: [2023-04-29 11:26:50,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +58: [2023-04-29 11:26:50,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +13: [2023-04-29 11:26:50,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +29: [2023-04-29 11:26:50,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +10: [2023-04-29 11:26:50,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +58: [2023-04-29 11:26:50,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 9: [2023-04-29 11:26:50,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +10: [2023-04-29 11:26:50,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +37: [2023-04-29 11:26:50,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +60: [2023-04-29 11:26:50,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... + 9: [2023-04-29 11:26:50,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 6: [2023-04-29 11:26:50,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +60: [2023-04-29 11:26:50,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +51: [2023-04-29 11:26:50,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 9: [2023-04-29 11:26:50,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 6: [2023-04-29 11:26:50,400] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +13: [2023-04-29 11:26:50,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 1: [2023-04-29 11:26:50,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +58: [2023-04-29 11:26:50,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +16: [2023-04-29 11:26:50,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +16: [2023-04-29 11:26:50,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +10: [2023-04-29 11:26:50,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +44: [2023-04-29 11:26:50,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +44: [2023-04-29 11:26:50,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +60: [2023-04-29 11:26:50,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +58: [2023-04-29 11:26:50,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +23: [2023-04-29 11:26:50,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +23: [2023-04-29 11:26:50,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 11:26:50,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +60: [2023-04-29 11:26:50,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +46: [2023-04-29 11:26:50,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +46: [2023-04-29 11:26:50,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +52: [2023-04-29 11:26:50,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +52: [2023-04-29 11:26:50,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +52: [2023-04-29 11:26:50,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +52: [2023-04-29 11:26:50,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +52: [2023-04-29 11:26:50,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +52: [2023-04-29 11:26:50,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +52: [2023-04-29 11:26:50,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +24: [2023-04-29 11:26:50,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +23: [2023-04-29 11:26:50,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +23: [2023-04-29 11:26:50,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +52: [2023-04-29 11:26:50,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +58: [2023-04-29 11:26:50,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +58: [2023-04-29 11:26:50,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 3: [2023-04-29 11:26:50,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +24: [2023-04-29 11:26:50,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +29: [2023-04-29 11:26:50,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +60: [2023-04-29 11:26:50,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +29: [2023-04-29 11:26:50,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 6: [2023-04-29 11:26:50,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +29: [2023-04-29 11:26:50,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 4: [2023-04-29 11:26:50,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 4: [2023-04-29 11:26:50,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +16: [2023-04-29 11:26:50,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +23: [2023-04-29 11:26:50,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +44: [2023-04-29 11:26:50,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +44: [2023-04-29 11:26:50,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +44: [2023-04-29 11:26:50,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +44: [2023-04-29 11:26:50,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +44: [2023-04-29 11:26:50,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +24: [2023-04-29 11:26:50,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +44: [2023-04-29 11:26:50,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +16: [2023-04-29 11:26:50,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +24: [2023-04-29 11:26:50,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +60: [2023-04-29 11:26:50,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +23: [2023-04-29 11:26:50,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... + 6: [2023-04-29 11:26:50,407] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +51: [2023-04-29 11:26:50,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +23: [2023-04-29 11:26:50,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +11: [2023-04-29 11:26:50,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +52: [2023-04-29 11:26:50,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +52: [2023-04-29 11:26:50,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +21: [2023-04-29 11:26:50,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +25: [2023-04-29 11:26:50,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 8: [2023-04-29 11:26:50,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +25: [2023-04-29 11:26:50,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +29: [2023-04-29 11:26:50,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +29: [2023-04-29 11:26:50,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 6: [2023-04-29 11:26:50,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +52: [2023-04-29 11:26:50,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... + 6: [2023-04-29 11:26:50,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +44: [2023-04-29 11:26:50,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +25: [2023-04-29 11:26:50,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +44: [2023-04-29 11:26:50,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +25: [2023-04-29 11:26:50,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +30: [2023-04-29 11:26:50,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 6: [2023-04-29 11:26:50,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +23: [2023-04-29 11:26:50,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +23: [2023-04-29 11:26:50,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +52: [2023-04-29 11:26:50,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +52: [2023-04-29 11:26:50,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 8: [2023-04-29 11:26:50,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +52: [2023-04-29 11:26:50,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +52: [2023-04-29 11:26:50,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +47: [2023-04-29 11:26:50,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +47: [2023-04-29 11:26:50,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +27: [2023-04-29 11:26:50,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +31: [2023-04-29 11:26:50,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 8: [2023-04-29 11:26:50,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 8: [2023-04-29 11:26:50,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +34: [2023-04-29 11:26:50,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +52: [2023-04-29 11:26:50,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +37: [2023-04-29 11:26:50,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +28: [2023-04-29 11:26:50,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +28: [2023-04-29 11:26:50,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 11:26:50,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +31: [2023-04-29 11:26:50,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +46: [2023-04-29 11:26:50,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +44: [2023-04-29 11:26:50,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +44: [2023-04-29 11:26:50,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +30: [2023-04-29 11:26:50,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +27: [2023-04-29 11:26:50,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +27: [2023-04-29 11:26:50,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +34: [2023-04-29 11:26:50,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +27: [2023-04-29 11:26:50,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +11: [2023-04-29 11:26:50,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +23: [2023-04-29 11:26:50,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +13: [2023-04-29 11:26:50,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +27: [2023-04-29 11:26:50,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 11:26:50,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +34: [2023-04-29 11:26:50,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +44: [2023-04-29 11:26:50,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +60: [2023-04-29 11:26:50,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +13: [2023-04-29 11:26:50,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +27: [2023-04-29 11:26:50,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +28: [2023-04-29 11:26:50,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +37: [2023-04-29 11:26:50,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +37: [2023-04-29 11:26:50,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +27: [2023-04-29 11:26:50,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +28: [2023-04-29 11:26:50,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +44: [2023-04-29 11:26:50,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +44: [2023-04-29 11:26:50,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +21: [2023-04-29 11:26:50,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +60: [2023-04-29 11:26:50,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +44: [2023-04-29 11:26:50,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +10: [2023-04-29 11:26:50,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +10: [2023-04-29 11:26:50,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +60: [2023-04-29 11:26:50,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +29: [2023-04-29 11:26:50,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +22: [2023-04-29 11:26:50,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +30: [2023-04-29 11:26:50,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +31: [2023-04-29 11:26:50,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +30: [2023-04-29 11:26:50,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +31: [2023-04-29 11:26:50,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +34: [2023-04-29 11:26:50,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +27: [2023-04-29 11:26:50,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 11:26:50,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +24: [2023-04-29 11:26:50,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +24: [2023-04-29 11:26:50,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +11: [2023-04-29 11:26:50,417] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +47: [2023-04-29 11:26:50,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +10: [2023-04-29 11:26:50,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 3: [2023-04-29 11:26:50,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +22: [2023-04-29 11:26:50,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +20: [2023-04-29 11:26:50,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +20: [2023-04-29 11:26:50,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +27: [2023-04-29 11:26:50,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +22: [2023-04-29 11:26:50,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +19: [2023-04-29 11:26:50,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +19: [2023-04-29 11:26:50,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +51: [2023-04-29 11:26:50,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +27: [2023-04-29 11:26:50,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +27: [2023-04-29 11:26:50,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +60: [2023-04-29 11:26:50,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +20: [2023-04-29 11:26:50,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +20: [2023-04-29 11:26:50,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +19: [2023-04-29 11:26:50,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +20: [2023-04-29 11:26:50,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +58: [2023-04-29 11:26:50,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +58: [2023-04-29 11:26:50,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +58: [2023-04-29 11:26:50,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +20: [2023-04-29 11:26:50,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +19: [2023-04-29 11:26:50,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +24: [2023-04-29 11:26:50,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +58: [2023-04-29 11:26:50,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +20: [2023-04-29 11:26:50,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +11: [2023-04-29 11:26:50,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +29: [2023-04-29 11:26:50,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +20: [2023-04-29 11:26:50,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +27: [2023-04-29 11:26:50,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +46: [2023-04-29 11:26:50,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 7: [2023-04-29 11:26:50,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +42: [2023-04-29 11:26:50,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +42: [2023-04-29 11:26:50,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +42: [2023-04-29 11:26:50,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +42: [2023-04-29 11:26:50,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +42: [2023-04-29 11:26:50,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +42: [2023-04-29 11:26:50,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +42: [2023-04-29 11:26:50,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +42: [2023-04-29 11:26:50,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +24: [2023-04-29 11:26:50,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 11:26:50,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +31: [2023-04-29 11:26:50,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +31: [2023-04-29 11:26:50,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +31: [2023-04-29 11:26:50,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +11: [2023-04-29 11:26:50,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +51: [2023-04-29 11:26:50,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +19: [2023-04-29 11:26:50,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +19: [2023-04-29 11:26:50,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +21: [2023-04-29 11:26:50,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +29: [2023-04-29 11:26:50,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +22: [2023-04-29 11:26:50,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 11:26:50,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +53: [2023-04-29 11:26:50,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +53: [2023-04-29 11:26:50,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +53: [2023-04-29 11:26:50,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +53: [2023-04-29 11:26:50,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +53: [2023-04-29 11:26:50,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +53: [2023-04-29 11:26:50,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +53: [2023-04-29 11:26:50,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +53: [2023-04-29 11:26:50,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +19: [2023-04-29 11:26:50,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 11:26:50,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 11:26:50,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +19: [2023-04-29 11:26:50,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +42: [2023-04-29 11:26:50,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +21: [2023-04-29 11:26:50,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +21: [2023-04-29 11:26:50,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +21: [2023-04-29 11:26:50,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +42: [2023-04-29 11:26:50,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +37: [2023-04-29 11:26:50,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +13: [2023-04-29 11:26:50,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +42: [2023-04-29 11:26:50,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... + 5: [2023-04-29 11:26:50,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +42: [2023-04-29 11:26:50,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... + 5: [2023-04-29 11:26:50,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +42: [2023-04-29 11:26:50,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +42: [2023-04-29 11:26:50,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... + 5: [2023-04-29 11:26:50,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +29: [2023-04-29 11:26:50,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +53: [2023-04-29 11:26:50,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +53: [2023-04-29 11:26:50,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +13: [2023-04-29 11:26:50,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +13: [2023-04-29 11:26:50,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +51: [2023-04-29 11:26:50,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +53: [2023-04-29 11:26:50,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +11: [2023-04-29 11:26:50,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +53: [2023-04-29 11:26:50,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +42: [2023-04-29 11:26:50,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +53: [2023-04-29 11:26:50,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +42: [2023-04-29 11:26:50,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... + 8: [2023-04-29 11:26:50,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +16: [2023-04-29 11:26:50,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +16: [2023-04-29 11:26:50,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +53: [2023-04-29 11:26:50,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +23: [2023-04-29 11:26:50,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +53: [2023-04-29 11:26:50,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +13: [2023-04-29 11:26:50,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +53: [2023-04-29 11:26:50,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +63: [2023-04-29 11:26:50,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +63: [2023-04-29 11:26:50,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +21: [2023-04-29 11:26:50,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +63: [2023-04-29 11:26:50,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +63: [2023-04-29 11:26:50,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +32: [2023-04-29 11:26:50,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +16: [2023-04-29 11:26:50,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 5: [2023-04-29 11:26:50,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +15: [2023-04-29 11:26:50,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +46: [2023-04-29 11:26:50,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +46: [2023-04-29 11:26:50,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 5: [2023-04-29 11:26:50,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +21: [2023-04-29 11:26:50,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +31: [2023-04-29 11:26:50,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +41: [2023-04-29 11:26:50,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 8: [2023-04-29 11:26:50,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +32: [2023-04-29 11:26:50,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. + 5: [2023-04-29 11:26:50,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +23: [2023-04-29 11:26:50,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +21: [2023-04-29 11:26:50,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +47: [2023-04-29 11:26:50,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +12: [2023-04-29 11:26:50,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +12: [2023-04-29 11:26:50,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +15: [2023-04-29 11:26:50,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +57: [2023-04-29 11:26:50,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +63: [2023-04-29 11:26:50,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 8: [2023-04-29 11:26:50,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +63: [2023-04-29 11:26:50,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 8: [2023-04-29 11:26:50,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +12: [2023-04-29 11:26:50,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +12: [2023-04-29 11:26:50,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +47: [2023-04-29 11:26:50,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +23: [2023-04-29 11:26:50,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 8: [2023-04-29 11:26:50,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +57: [2023-04-29 11:26:50,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +57: [2023-04-29 11:26:50,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +16: [2023-04-29 11:26:50,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +21: [2023-04-29 11:26:50,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +57: [2023-04-29 11:26:50,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +12: [2023-04-29 11:26:50,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +63: [2023-04-29 11:26:50,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +12: [2023-04-29 11:26:50,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 3: [2023-04-29 11:26:50,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +63: [2023-04-29 11:26:50,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +34: [2023-04-29 11:26:50,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +47: [2023-04-29 11:26:50,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +43: [2023-04-29 11:26:50,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +43: [2023-04-29 11:26:50,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +38: [2023-04-29 11:26:50,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +47: [2023-04-29 11:26:50,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +32: [2023-04-29 11:26:50,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. + 2: [2023-04-29 11:26:50,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 2: [2023-04-29 11:26:50,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 2: [2023-04-29 11:26:50,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 2: [2023-04-29 11:26:50,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +29: [2023-04-29 11:26:50,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +10: [2023-04-29 11:26:50,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +32: [2023-04-29 11:26:50,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +43: [2023-04-29 11:26:50,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +43: [2023-04-29 11:26:50,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +37: [2023-04-29 11:26:50,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +43: [2023-04-29 11:26:50,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +61: [2023-04-29 11:26:50,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +11: [2023-04-29 11:26:50,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +41: [2023-04-29 11:26:50,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +34: [2023-04-29 11:26:50,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +41: [2023-04-29 11:26:50,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +41: [2023-04-29 11:26:50,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +12: [2023-04-29 11:26:50,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +12: [2023-04-29 11:26:50,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +43: [2023-04-29 11:26:50,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +58: [2023-04-29 11:26:50,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +37: [2023-04-29 11:26:50,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +37: [2023-04-29 11:26:50,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +43: [2023-04-29 11:26:50,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +10: [2023-04-29 11:26:50,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +43: [2023-04-29 11:26:50,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +10: [2023-04-29 11:26:50,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +38: [2023-04-29 11:26:50,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +38: [2023-04-29 11:26:50,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +38: [2023-04-29 11:26:50,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +29: [2023-04-29 11:26:50,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +61: [2023-04-29 11:26:50,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +61: [2023-04-29 11:26:50,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +61: [2023-04-29 11:26:50,454] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +20: [2023-04-29 11:26:50,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +10: [2023-04-29 11:26:50,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +20: [2023-04-29 11:26:50,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +31: [2023-04-29 11:26:50,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +31: [2023-04-29 11:26:50,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +31: [2023-04-29 11:26:50,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +21: [2023-04-29 11:26:50,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +15: [2023-04-29 11:26:50,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +58: [2023-04-29 11:26:50,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +20: [2023-04-29 11:26:50,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +58: [2023-04-29 11:26:50,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +38: [2023-04-29 11:26:50,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +38: [2023-04-29 11:26:50,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +11: [2023-04-29 11:26:50,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +11: [2023-04-29 11:26:50,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +11: [2023-04-29 11:26:50,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +58: [2023-04-29 11:26:50,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +36: [2023-04-29 11:26:50,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +36: [2023-04-29 11:26:50,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +15: [2023-04-29 11:26:50,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +15: [2023-04-29 11:26:50,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +38: [2023-04-29 11:26:50,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +38: [2023-04-29 11:26:50,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +36: [2023-04-29 11:26:50,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +17: [2023-04-29 11:26:50,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +36: [2023-04-29 11:26:50,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +21: [2023-04-29 11:26:50,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +21: [2023-04-29 11:26:50,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +50: [2023-04-29 11:26:50,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +21: [2023-04-29 11:26:50,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +50: [2023-04-29 11:26:50,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +20: [2023-04-29 11:26:50,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +20: [2023-04-29 11:26:50,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +20: [2023-04-29 11:26:50,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +38: [2023-04-29 11:26:50,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +20: [2023-04-29 11:26:50,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +38: [2023-04-29 11:26:50,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +41: [2023-04-29 11:26:50,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +32: [2023-04-29 11:26:50,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +20: [2023-04-29 11:26:50,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +52: [2023-04-29 11:26:50,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +38: [2023-04-29 11:26:50,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +38: [2023-04-29 11:26:50,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +50: [2023-04-29 11:26:50,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +21: [2023-04-29 11:26:50,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +17: [2023-04-29 11:26:50,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +15: [2023-04-29 11:26:50,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +15: [2023-04-29 11:26:50,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +14: [2023-04-29 11:26:50,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +14: [2023-04-29 11:26:50,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +15: [2023-04-29 11:26:50,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +12: [2023-04-29 11:26:50,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +54: [2023-04-29 11:26:50,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +54: [2023-04-29 11:26:50,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +54: [2023-04-29 11:26:50,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +54: [2023-04-29 11:26:50,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +54: [2023-04-29 11:26:50,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +54: [2023-04-29 11:26:50,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +30: [2023-04-29 11:26:50,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +54: [2023-04-29 11:26:50,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +57: [2023-04-29 11:26:50,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +17: [2023-04-29 11:26:50,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +17: [2023-04-29 11:26:50,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +26: [2023-04-29 11:26:50,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +26: [2023-04-29 11:26:50,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +26: [2023-04-29 11:26:50,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +38: [2023-04-29 11:26:50,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +26: [2023-04-29 11:26:50,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +12: [2023-04-29 11:26:50,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +57: [2023-04-29 11:26:50,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +25: [2023-04-29 11:26:50,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +10: [2023-04-29 11:26:50,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +47: [2023-04-29 11:26:50,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +21: [2023-04-29 11:26:50,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +14: [2023-04-29 11:26:50,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +14: [2023-04-29 11:26:50,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +14: [2023-04-29 11:26:50,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +14: [2023-04-29 11:26:50,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +14: [2023-04-29 11:26:50,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +14: [2023-04-29 11:26:50,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +54: [2023-04-29 11:26:50,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +24: [2023-04-29 11:26:50,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +12: [2023-04-29 11:26:50,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +31: [2023-04-29 11:26:50,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +57: [2023-04-29 11:26:50,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... + 1: [2023-04-29 11:26:50,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +12: [2023-04-29 11:26:50,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +12: [2023-04-29 11:26:50,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +12: [2023-04-29 11:26:50,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +50: [2023-04-29 11:26:50,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +54: [2023-04-29 11:26:50,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +32: [2023-04-29 11:26:50,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +54: [2023-04-29 11:26:50,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +54: [2023-04-29 11:26:50,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +54: [2023-04-29 11:26:50,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +30: [2023-04-29 11:26:50,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +14: [2023-04-29 11:26:50,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 2: [2023-04-29 11:26:50,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +26: [2023-04-29 11:26:50,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +57: [2023-04-29 11:26:50,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +54: [2023-04-29 11:26:50,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +25: [2023-04-29 11:26:50,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +14: [2023-04-29 11:26:50,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +14: [2023-04-29 11:26:50,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +26: [2023-04-29 11:26:50,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +14: [2023-04-29 11:26:50,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +26: [2023-04-29 11:26:50,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +26: [2023-04-29 11:26:50,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +15: [2023-04-29 11:26:50,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +15: [2023-04-29 11:26:50,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +61: [2023-04-29 11:26:50,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +54: [2023-04-29 11:26:50,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +41: [2023-04-29 11:26:50,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +27: [2023-04-29 11:26:50,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +15: [2023-04-29 11:26:50,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +54: [2023-04-29 11:26:50,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +14: [2023-04-29 11:26:50,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +14: [2023-04-29 11:26:50,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +41: [2023-04-29 11:26:50,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +52: [2023-04-29 11:26:50,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +41: [2023-04-29 11:26:50,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +54: [2023-04-29 11:26:50,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... + 2: [2023-04-29 11:26:50,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +14: [2023-04-29 11:26:50,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +58: [2023-04-29 11:26:50,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +14: [2023-04-29 11:26:50,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +27: [2023-04-29 11:26:50,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +38: [2023-04-29 11:26:50,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +12: [2023-04-29 11:26:50,478] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +32: [2023-04-29 11:26:50,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 11:26:50,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +44: [2023-04-29 11:26:50,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +27: [2023-04-29 11:26:50,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 9: [2023-04-29 11:26:50,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +12: [2023-04-29 11:26:50,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +44: [2023-04-29 11:26:50,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +24: [2023-04-29 11:26:50,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +31: [2023-04-29 11:26:50,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +29: [2023-04-29 11:26:50,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +52: [2023-04-29 11:26:50,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +25: [2023-04-29 11:26:50,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +28: [2023-04-29 11:26:50,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +28: [2023-04-29 11:26:50,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +25: [2023-04-29 11:26:50,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +60: [2023-04-29 11:26:50,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +60: [2023-04-29 11:26:50,481] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +18: [2023-04-29 11:26:50,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +18: [2023-04-29 11:26:50,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +60: [2023-04-29 11:26:50,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +60: [2023-04-29 11:26:50,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +60: [2023-04-29 11:26:50,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +60: [2023-04-29 11:26:50,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +18: [2023-04-29 11:26:50,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +44: [2023-04-29 11:26:50,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +18: [2023-04-29 11:26:50,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +27: [2023-04-29 11:26:50,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +35: [2023-04-29 11:26:50,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +35: [2023-04-29 11:26:50,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +58: [2023-04-29 11:26:50,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +27: [2023-04-29 11:26:50,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... + 5: [2023-04-29 11:26:50,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +36: [2023-04-29 11:26:50,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +25: [2023-04-29 11:26:50,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +19: [2023-04-29 11:26:50,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +35: [2023-04-29 11:26:50,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +35: [2023-04-29 11:26:50,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +15: [2023-04-29 11:26:50,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +29: [2023-04-29 11:26:50,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 9: [2023-04-29 11:26:50,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +61: [2023-04-29 11:26:50,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +35: [2023-04-29 11:26:50,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +35: [2023-04-29 11:26:50,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +35: [2023-04-29 11:26:50,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +52: [2023-04-29 11:26:50,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +15: [2023-04-29 11:26:50,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +35: [2023-04-29 11:26:50,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +15: [2023-04-29 11:26:50,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +27: [2023-04-29 11:26:50,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +28: [2023-04-29 11:26:50,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +28: [2023-04-29 11:26:50,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +27: [2023-04-29 11:26:50,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +30: [2023-04-29 11:26:50,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +30: [2023-04-29 11:26:50,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +36: [2023-04-29 11:26:50,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 2: [2023-04-29 11:26:50,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 2: [2023-04-29 11:26:50,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 2: [2023-04-29 11:26:50,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +31: [2023-04-29 11:26:50,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... + 3: [2023-04-29 11:26:50,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +36: [2023-04-29 11:26:50,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +36: [2023-04-29 11:26:50,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +27: [2023-04-29 11:26:50,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +27: [2023-04-29 11:26:50,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +27: [2023-04-29 11:26:50,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +29: [2023-04-29 11:26:50,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +32: [2023-04-29 11:26:50,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +17: [2023-04-29 11:26:50,486] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +44: [2023-04-29 11:26:50,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +60: [2023-04-29 11:26:50,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +18: [2023-04-29 11:26:50,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +61: [2023-04-29 11:26:50,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +61: [2023-04-29 11:26:50,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +24: [2023-04-29 11:26:50,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +18: [2023-04-29 11:26:50,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +18: [2023-04-29 11:26:50,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +25: [2023-04-29 11:26:50,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... + 2: [2023-04-29 11:26:50,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +60: [2023-04-29 11:26:50,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +60: [2023-04-29 11:26:50,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +60: [2023-04-29 11:26:50,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +18: [2023-04-29 11:26:50,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 2: [2023-04-29 11:26:50,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 5: [2023-04-29 11:26:50,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +25: [2023-04-29 11:26:50,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +39: [2023-04-29 11:26:50,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +39: [2023-04-29 11:26:50,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +24: [2023-04-29 11:26:50,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +15: [2023-04-29 11:26:50,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +25: [2023-04-29 11:26:50,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +15: [2023-04-29 11:26:50,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +19: [2023-04-29 11:26:50,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +39: [2023-04-29 11:26:50,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +39: [2023-04-29 11:26:50,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +11: [2023-04-29 11:26:50,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +11: [2023-04-29 11:26:50,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +11: [2023-04-29 11:26:50,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +28: [2023-04-29 11:26:50,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +28: [2023-04-29 11:26:50,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +30: [2023-04-29 11:26:50,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +17: [2023-04-29 11:26:50,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +29: [2023-04-29 11:26:50,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +28: [2023-04-29 11:26:50,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +28: [2023-04-29 11:26:50,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +29: [2023-04-29 11:26:50,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +35: [2023-04-29 11:26:50,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +35: [2023-04-29 11:26:50,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +30: [2023-04-29 11:26:50,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +35: [2023-04-29 11:26:50,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +35: [2023-04-29 11:26:50,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +38: [2023-04-29 11:26:50,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +38: [2023-04-29 11:26:50,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +30: [2023-04-29 11:26:50,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... + 3: [2023-04-29 11:26:50,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 11:26:50,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +27: [2023-04-29 11:26:50,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +31: [2023-04-29 11:26:50,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +24: [2023-04-29 11:26:50,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +29: [2023-04-29 11:26:50,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +50: [2023-04-29 11:26:50,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +39: [2023-04-29 11:26:50,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +13: [2023-04-29 11:26:50,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +50: [2023-04-29 11:26:50,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +27: [2023-04-29 11:26:50,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +42: [2023-04-29 11:26:50,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +19: [2023-04-29 11:26:50,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +35: [2023-04-29 11:26:50,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +29: [2023-04-29 11:26:50,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +52: [2023-04-29 11:26:50,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +39: [2023-04-29 11:26:50,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +26: [2023-04-29 11:26:50,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +26: [2023-04-29 11:26:50,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +24: [2023-04-29 11:26:50,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +35: [2023-04-29 11:26:50,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +39: [2023-04-29 11:26:50,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +53: [2023-04-29 11:26:50,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +53: [2023-04-29 11:26:50,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +39: [2023-04-29 11:26:50,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +35: [2023-04-29 11:26:50,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt... +35: [2023-04-29 11:26:50,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt... +26: [2023-04-29 11:26:50,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +26: [2023-04-29 11:26:50,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. + 9: [2023-04-29 11:26:50,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +24: [2023-04-29 11:26:50,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +16: [2023-04-29 11:26:50,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +31: [2023-04-29 11:26:50,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +30: [2023-04-29 11:26:50,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +31: [2023-04-29 11:26:50,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +13: [2023-04-29 11:26:50,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +17: [2023-04-29 11:26:50,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +56: [2023-04-29 11:26:50,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +56: [2023-04-29 11:26:50,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 9: [2023-04-29 11:26:50,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +63: [2023-04-29 11:26:50,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +56: [2023-04-29 11:26:50,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +13: [2023-04-29 11:26:50,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +13: [2023-04-29 11:26:50,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +17: [2023-04-29 11:26:50,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +30: [2023-04-29 11:26:50,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +30: [2023-04-29 11:26:50,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +10: [2023-04-29 11:26:50,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +56: [2023-04-29 11:26:50,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +50: [2023-04-29 11:26:50,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 5: [2023-04-29 11:26:50,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +58: [2023-04-29 11:26:50,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +42: [2023-04-29 11:26:50,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +42: [2023-04-29 11:26:50,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +30: [2023-04-29 11:26:50,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +63: [2023-04-29 11:26:50,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +58: [2023-04-29 11:26:50,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +31: [2023-04-29 11:26:50,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +29: [2023-04-29 11:26:50,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +53: [2023-04-29 11:26:50,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +53: [2023-04-29 11:26:50,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +56: [2023-04-29 11:26:50,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 9: [2023-04-29 11:26:50,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +43: [2023-04-29 11:26:50,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +19: [2023-04-29 11:26:50,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +30: [2023-04-29 11:26:50,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +16: [2023-04-29 11:26:50,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... + 3: [2023-04-29 11:26:50,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +13: [2023-04-29 11:26:50,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +24: [2023-04-29 11:26:50,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... + 9: [2023-04-29 11:26:50,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 11:26:50,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +52: [2023-04-29 11:26:50,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 8: [2023-04-29 11:26:50,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +56: [2023-04-29 11:26:50,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +56: [2023-04-29 11:26:50,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +31: [2023-04-29 11:26:50,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +44: [2023-04-29 11:26:50,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +42: [2023-04-29 11:26:50,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +30: [2023-04-29 11:26:50,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +30: [2023-04-29 11:26:50,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +50: [2023-04-29 11:26:50,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +56: [2023-04-29 11:26:50,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +13: [2023-04-29 11:26:50,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +13: [2023-04-29 11:26:50,506] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +30: [2023-04-29 11:26:50,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +10: [2023-04-29 11:26:50,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 5: [2023-04-29 11:26:50,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... + 5: [2023-04-29 11:26:50,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... + 5: [2023-04-29 11:26:50,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +58: [2023-04-29 11:26:50,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 5: [2023-04-29 11:26:50,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +30: [2023-04-29 11:26:50,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +16: [2023-04-29 11:26:50,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 9: [2023-04-29 11:26:50,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... + 4: [2023-04-29 11:26:50,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +60: [2023-04-29 11:26:50,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +44: [2023-04-29 11:26:50,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +27: [2023-04-29 11:26:50,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +31: [2023-04-29 11:26:50,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +52: [2023-04-29 11:26:50,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +19: [2023-04-29 11:26:50,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +13: [2023-04-29 11:26:50,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +16: [2023-04-29 11:26:50,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 9: [2023-04-29 11:26:50,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +60: [2023-04-29 11:26:50,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +58: [2023-04-29 11:26:50,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +44: [2023-04-29 11:26:50,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 8: [2023-04-29 11:26:50,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +21: [2023-04-29 11:26:50,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 8: [2023-04-29 11:26:50,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +19: [2023-04-29 11:26:50,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +16: [2023-04-29 11:26:50,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +52: [2023-04-29 11:26:50,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... + 5: [2023-04-29 11:26:50,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +27: [2023-04-29 11:26:50,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +60: [2023-04-29 11:26:50,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +63: [2023-04-29 11:26:50,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +63: [2023-04-29 11:26:50,515] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +60: [2023-04-29 11:26:50,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +27: [2023-04-29 11:26:50,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +44: [2023-04-29 11:26:50,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +16: [2023-04-29 11:26:50,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... + 8: [2023-04-29 11:26:50,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +20: [2023-04-29 11:26:50,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +27: [2023-04-29 11:26:50,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +19: [2023-04-29 11:26:50,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +21: [2023-04-29 11:26:50,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +16: [2023-04-29 11:26:50,519] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +43: [2023-04-29 11:26:50,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 9: [2023-04-29 11:26:50,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +10: [2023-04-29 11:26:50,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +60: [2023-04-29 11:26:50,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +20: [2023-04-29 11:26:50,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +43: [2023-04-29 11:26:50,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +20: [2023-04-29 11:26:50,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +26: [2023-04-29 11:26:50,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +16: [2023-04-29 11:26:50,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +60: [2023-04-29 11:26:50,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... + 4: [2023-04-29 11:26:50,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... + 8: [2023-04-29 11:26:50,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +53: [2023-04-29 11:26:50,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... + 7: [2023-04-29 11:26:50,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +22: [2023-04-29 11:26:50,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +22: [2023-04-29 11:26:50,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +42: [2023-04-29 11:26:50,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +10: [2023-04-29 11:26:50,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +63: [2023-04-29 11:26:50,525] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +43: [2023-04-29 11:26:50,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +63: [2023-04-29 11:26:50,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +26: [2023-04-29 11:26:50,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +20: [2023-04-29 11:26:50,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +20: [2023-04-29 11:26:50,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +53: [2023-04-29 11:26:50,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +22: [2023-04-29 11:26:50,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +43: [2023-04-29 11:26:50,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 8: [2023-04-29 11:26:50,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +22: [2023-04-29 11:26:50,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_18-model_01-model_states.pt. +20: [2023-04-29 11:26:50,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +12: [2023-04-29 11:26:50,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... + 9: [2023-04-29 11:26:50,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... + 0: [2023-04-29 11:26:50,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +58: [2023-04-29 11:26:50,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +10: [2023-04-29 11:26:50,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +26: [2023-04-29 11:26:50,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +26: [2023-04-29 11:26:50,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +42: [2023-04-29 11:26:50,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +19: [2023-04-29 11:26:50,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +42: [2023-04-29 11:26:50,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +53: [2023-04-29 11:26:50,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +53: [2023-04-29 11:26:50,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +21: [2023-04-29 11:26:50,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +21: [2023-04-29 11:26:50,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +12: [2023-04-29 11:26:50,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +54: [2023-04-29 11:26:50,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +36: [2023-04-29 11:26:50,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +36: [2023-04-29 11:26:50,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +36: [2023-04-29 11:26:50,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +36: [2023-04-29 11:26:50,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +20: [2023-04-29 11:26:50,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +48: [2023-04-29 11:26:50,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 11:26:50,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +56: [2023-04-29 11:26:50,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +56: [2023-04-29 11:26:50,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. + 1: [2023-04-29 11:26:50,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +58: [2023-04-29 11:26:50,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +48: [2023-04-29 11:26:50,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +54: [2023-04-29 11:26:50,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +48: [2023-04-29 11:26:50,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +20: [2023-04-29 11:26:50,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +12: [2023-04-29 11:26:50,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +56: [2023-04-29 11:26:50,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. + 5: [2023-04-29 11:26:50,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +58: [2023-04-29 11:26:50,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +56: [2023-04-29 11:26:50,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +58: [2023-04-29 11:26:50,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... + 8: [2023-04-29 11:26:50,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +32: [2023-04-29 11:26:50,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +42: [2023-04-29 11:26:50,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 5: [2023-04-29 11:26:50,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +54: [2023-04-29 11:26:50,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +32: [2023-04-29 11:26:50,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +32: [2023-04-29 11:26:50,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +32: [2023-04-29 11:26:50,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +32: [2023-04-29 11:26:50,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +36: [2023-04-29 11:26:50,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +10: [2023-04-29 11:26:50,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 11:26:50,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +21: [2023-04-29 11:26:50,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +21: [2023-04-29 11:26:50,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... + 1: [2023-04-29 11:26:50,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +48: [2023-04-29 11:26:50,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +36: [2023-04-29 11:26:50,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +48: [2023-04-29 11:26:50,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +36: [2023-04-29 11:26:50,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +36: [2023-04-29 11:26:50,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +14: [2023-04-29 11:26:50,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +14: [2023-04-29 11:26:50,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +12: [2023-04-29 11:26:50,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +12: [2023-04-29 11:26:50,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +14: [2023-04-29 11:26:50,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +12: [2023-04-29 11:26:50,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +58: [2023-04-29 11:26:50,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +32: [2023-04-29 11:26:50,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +48: [2023-04-29 11:26:50,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +48: [2023-04-29 11:26:50,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +63: [2023-04-29 11:26:50,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +63: [2023-04-29 11:26:50,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +36: [2023-04-29 11:26:50,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +36: [2023-04-29 11:26:50,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +28: [2023-04-29 11:26:50,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +28: [2023-04-29 11:26:50,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +28: [2023-04-29 11:26:50,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +21: [2023-04-29 11:26:50,547] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +28: [2023-04-29 11:26:50,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +49: [2023-04-29 11:26:50,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +49: [2023-04-29 11:26:50,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +12: [2023-04-29 11:26:50,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +58: [2023-04-29 11:26:50,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +12: [2023-04-29 11:26:50,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +10: [2023-04-29 11:26:50,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +10: [2023-04-29 11:26:50,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +26: [2023-04-29 11:26:50,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +26: [2023-04-29 11:26:50,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +26: [2023-04-29 11:26:50,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +58: [2023-04-29 11:26:50,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +10: [2023-04-29 11:26:50,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +32: [2023-04-29 11:26:50,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +32: [2023-04-29 11:26:50,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +43: [2023-04-29 11:26:50,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +58: [2023-04-29 11:26:50,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +32: [2023-04-29 11:26:50,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +49: [2023-04-29 11:26:50,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +49: [2023-04-29 11:26:50,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. + 7: [2023-04-29 11:26:50,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +18: [2023-04-29 11:26:50,550] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +32: [2023-04-29 11:26:50,550] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +28: [2023-04-29 11:26:50,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +36: [2023-04-29 11:26:50,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +36: [2023-04-29 11:26:50,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +14: [2023-04-29 11:26:50,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +28: [2023-04-29 11:26:50,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 8: [2023-04-29 11:26:50,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 8: [2023-04-29 11:26:50,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +39: [2023-04-29 11:26:50,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +43: [2023-04-29 11:26:50,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +18: [2023-04-29 11:26:50,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +17: [2023-04-29 11:26:50,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +17: [2023-04-29 11:26:50,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +17: [2023-04-29 11:26:50,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +36: [2023-04-29 11:26:50,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +49: [2023-04-29 11:26:50,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. + 0: [2023-04-29 11:26:50,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +43: [2023-04-29 11:26:50,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +17: [2023-04-29 11:26:50,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +49: [2023-04-29 11:26:50,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +49: [2023-04-29 11:26:50,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +22: [2023-04-29 11:26:50,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +49: [2023-04-29 11:26:50,554] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +49: [2023-04-29 11:26:50,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +49: [2023-04-29 11:26:50,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +22: [2023-04-29 11:26:50,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +58: [2023-04-29 11:26:50,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +28: [2023-04-29 11:26:50,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +28: [2023-04-29 11:26:50,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +58: [2023-04-29 11:26:50,555] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +54: [2023-04-29 11:26:50,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +18: [2023-04-29 11:26:50,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +18: [2023-04-29 11:26:50,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +59: [2023-04-29 11:26:50,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +59: [2023-04-29 11:26:50,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +10: [2023-04-29 11:26:50,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +19: [2023-04-29 11:26:50,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +19: [2023-04-29 11:26:50,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +19: [2023-04-29 11:26:50,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +36: [2023-04-29 11:26:50,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +19: [2023-04-29 11:26:50,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +35: [2023-04-29 11:26:50,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +49: [2023-04-29 11:26:50,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +10: [2023-04-29 11:26:50,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... + 0: [2023-04-29 11:26:50,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +10: [2023-04-29 11:26:50,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +36: [2023-04-29 11:26:50,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +32: [2023-04-29 11:26:50,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +56: [2023-04-29 11:26:50,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +22: [2023-04-29 11:26:50,560] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +59: [2023-04-29 11:26:50,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +59: [2023-04-29 11:26:50,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +49: [2023-04-29 11:26:50,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +22: [2023-04-29 11:26:50,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt... +36: [2023-04-29 11:26:50,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +39: [2023-04-29 11:26:50,562] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +54: [2023-04-29 11:26:50,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +54: [2023-04-29 11:26:50,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +54: [2023-04-29 11:26:50,565] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +35: [2023-04-29 11:26:50,566] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +35: [2023-04-29 11:26:50,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +26: [2023-04-29 11:26:50,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +39: [2023-04-29 11:26:50,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +32: [2023-04-29 11:26:50,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +35: [2023-04-29 11:26:50,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_00-model_states.pt. +32: [2023-04-29 11:26:50,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... + 1: [2023-04-29 11:26:50,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +56: [2023-04-29 11:26:50,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +56: [2023-04-29 11:26:50,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 8: [2023-04-29 11:26:50,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +25: [2023-04-29 11:26:50,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +25: [2023-04-29 11:26:50,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +39: [2023-04-29 11:26:50,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... + 2: [2023-04-29 11:26:50,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... + 2: [2023-04-29 11:26:50,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... + 2: [2023-04-29 11:26:50,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +59: [2023-04-29 11:26:50,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +59: [2023-04-29 11:26:50,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +59: [2023-04-29 11:26:50,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +59: [2023-04-29 11:26:50,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +25: [2023-04-29 11:26:50,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +14: [2023-04-29 11:26:50,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +56: [2023-04-29 11:26:50,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +25: [2023-04-29 11:26:50,573] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +56: [2023-04-29 11:26:50,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +18: [2023-04-29 11:26:50,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +14: [2023-04-29 11:26:50,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +45: [2023-04-29 11:26:50,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +25: [2023-04-29 11:26:50,575] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +45: [2023-04-29 11:26:50,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +45: [2023-04-29 11:26:50,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +45: [2023-04-29 11:26:50,575] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +25: [2023-04-29 11:26:50,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +32: [2023-04-29 11:26:50,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +33: [2023-04-29 11:26:50,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +33: [2023-04-29 11:26:50,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. + 0: [2023-04-29 11:26:50,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +14: [2023-04-29 11:26:50,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +25: [2023-04-29 11:26:50,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +49: [2023-04-29 11:26:50,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +49: [2023-04-29 11:26:50,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +30: [2023-04-29 11:26:50,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +30: [2023-04-29 11:26:50,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +25: [2023-04-29 11:26:50,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +59: [2023-04-29 11:26:50,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +49: [2023-04-29 11:26:50,578] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +33: [2023-04-29 11:26:50,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +45: [2023-04-29 11:26:50,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +33: [2023-04-29 11:26:50,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +45: [2023-04-29 11:26:50,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +26: [2023-04-29 11:26:50,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +26: [2023-04-29 11:26:50,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +26: [2023-04-29 11:26:50,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +39: [2023-04-29 11:26:50,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +59: [2023-04-29 11:26:50,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +35: [2023-04-29 11:26:50,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +30: [2023-04-29 11:26:50,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +45: [2023-04-29 11:26:50,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +30: [2023-04-29 11:26:50,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +19: [2023-04-29 11:26:50,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +59: [2023-04-29 11:26:50,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +49: [2023-04-29 11:26:50,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +45: [2023-04-29 11:26:50,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +59: [2023-04-29 11:26:50,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +59: [2023-04-29 11:26:50,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +59: [2023-04-29 11:26:50,583] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +56: [2023-04-29 11:26:50,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +17: [2023-04-29 11:26:50,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +19: [2023-04-29 11:26:50,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +14: [2023-04-29 11:26:50,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +17: [2023-04-29 11:26:50,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +56: [2023-04-29 11:26:50,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +56: [2023-04-29 11:26:50,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +54: [2023-04-29 11:26:50,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +19: [2023-04-29 11:26:50,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +59: [2023-04-29 11:26:50,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +17: [2023-04-29 11:26:50,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +17: [2023-04-29 11:26:50,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +39: [2023-04-29 11:26:50,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +18: [2023-04-29 11:26:50,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +59: [2023-04-29 11:26:50,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +32: [2023-04-29 11:26:50,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +18: [2023-04-29 11:26:50,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +18: [2023-04-29 11:26:50,587] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +33: [2023-04-29 11:26:50,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +33: [2023-04-29 11:26:50,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +33: [2023-04-29 11:26:50,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +33: [2023-04-29 11:26:50,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +19: [2023-04-29 11:26:50,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +55: [2023-04-29 11:26:50,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +55: [2023-04-29 11:26:50,591] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +55: [2023-04-29 11:26:50,592] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +33: [2023-04-29 11:26:50,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +39: [2023-04-29 11:26:50,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +55: [2023-04-29 11:26:50,593] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +26: [2023-04-29 11:26:50,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +33: [2023-04-29 11:26:50,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +33: [2023-04-29 11:26:50,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +55: [2023-04-29 11:26:50,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +32: [2023-04-29 11:26:50,596] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +55: [2023-04-29 11:26:50,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +33: [2023-04-29 11:26:50,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +55: [2023-04-29 11:26:50,597] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +55: [2023-04-29 11:26:50,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +39: [2023-04-29 11:26:50,598] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +56: [2023-04-29 11:26:50,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +26: [2023-04-29 11:26:50,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +26: [2023-04-29 11:26:50,600] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +35: [2023-04-29 11:26:50,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +35: [2023-04-29 11:26:50,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +35: [2023-04-29 11:26:50,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +48: [2023-04-29 11:26:50,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +36: [2023-04-29 11:26:50,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +26: [2023-04-29 11:26:50,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +28: [2023-04-29 11:26:50,603] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +40: [2023-04-29 11:26:50,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +40: [2023-04-29 11:26:50,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +40: [2023-04-29 11:26:50,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +30: [2023-04-29 11:26:50,606] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +40: [2023-04-29 11:26:50,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 11:26:50,606] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,607] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +30: [2023-04-29 11:26:50,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +33: [2023-04-29 11:26:50,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +33: [2023-04-29 11:26:50,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +26: [2023-04-29 11:26:50,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +40: [2023-04-29 11:26:50,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +30: [2023-04-29 11:26:50,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +40: [2023-04-29 11:26:50,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +48: [2023-04-29 11:26:50,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +40: [2023-04-29 11:26:50,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +43: [2023-04-29 11:26:50,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +43: [2023-04-29 11:26:50,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +43: [2023-04-29 11:26:50,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +40: [2023-04-29 11:26:50,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +43: [2023-04-29 11:26:50,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +36: [2023-04-29 11:26:50,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +36: [2023-04-29 11:26:50,612] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +36: [2023-04-29 11:26:50,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +30: [2023-04-29 11:26:50,613] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +48: [2023-04-29 11:26:50,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +56: [2023-04-29 11:26:50,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +56: [2023-04-29 11:26:50,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +33: [2023-04-29 11:26:50,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +28: [2023-04-29 11:26:50,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +33: [2023-04-29 11:26:50,617] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +26: [2023-04-29 11:26:50,618] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +26: [2023-04-29 11:26:50,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +22: [2023-04-29 11:26:50,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +49: [2023-04-29 11:26:50,622] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +22: [2023-04-29 11:26:50,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +26: [2023-04-29 11:26:50,626] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +28: [2023-04-29 11:26:50,627] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +36: [2023-04-29 11:26:50,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +26: [2023-04-29 11:26:50,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +22: [2023-04-29 11:26:50,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +25: [2023-04-29 11:26:50,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +56: [2023-04-29 11:26:50,629] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +28: [2023-04-29 11:26:50,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +28: [2023-04-29 11:26:50,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +48: [2023-04-29 11:26:50,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +22: [2023-04-29 11:26:50,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +32: [2023-04-29 11:26:50,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +32: [2023-04-29 11:26:50,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +32: [2023-04-29 11:26:50,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +32: [2023-04-29 11:26:50,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +25: [2023-04-29 11:26:50,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,633] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +62: [2023-04-29 11:26:50,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +62: [2023-04-29 11:26:50,633] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +62: [2023-04-29 11:26:50,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +22: [2023-04-29 11:26:50,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +62: [2023-04-29 11:26:50,634] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +16: [2023-04-29 11:26:50,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +16: [2023-04-29 11:26:50,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +16: [2023-04-29 11:26:50,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +16: [2023-04-29 11:26:50,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +22: [2023-04-29 11:26:50,636] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_00-model_states.pt. +49: [2023-04-29 11:26:50,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 11:26:50,637] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +62: [2023-04-29 11:26:50,638] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +62: [2023-04-29 11:26:50,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +62: [2023-04-29 11:26:50,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +16: [2023-04-29 11:26:50,639] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +49: [2023-04-29 11:26:50,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +34: [2023-04-29 11:26:50,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +62: [2023-04-29 11:26:50,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +34: [2023-04-29 11:26:50,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +34: [2023-04-29 11:26:50,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +19: [2023-04-29 11:26:50,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +34: [2023-04-29 11:26:50,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +43: [2023-04-29 11:26:50,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +28: [2023-04-29 11:26:50,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +43: [2023-04-29 11:26:50,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +43: [2023-04-29 11:26:50,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +43: [2023-04-29 11:26:50,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +16: [2023-04-29 11:26:50,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +45: [2023-04-29 11:26:50,642] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +59: [2023-04-29 11:26:50,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 11:26:50,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +16: [2023-04-29 11:26:50,642] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +25: [2023-04-29 11:26:50,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +22: [2023-04-29 11:26:50,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +49: [2023-04-29 11:26:50,643] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 11:26:50,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +16: [2023-04-29 11:26:50,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +36: [2023-04-29 11:26:50,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +19: [2023-04-29 11:26:50,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +34: [2023-04-29 11:26:50,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +36: [2023-04-29 11:26:50,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +36: [2023-04-29 11:26:50,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +45: [2023-04-29 11:26:50,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +59: [2023-04-29 11:26:50,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +34: [2023-04-29 11:26:50,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +56: [2023-04-29 11:26:50,645] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +22: [2023-04-29 11:26:50,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt... +49: [2023-04-29 11:26:50,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +49: [2023-04-29 11:26:50,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +17: [2023-04-29 11:26:50,646] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +49: [2023-04-29 11:26:50,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +48: [2023-04-29 11:26:50,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +48: [2023-04-29 11:26:50,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +48: [2023-04-29 11:26:50,647] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +48: [2023-04-29 11:26:50,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +34: [2023-04-29 11:26:50,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +34: [2023-04-29 11:26:50,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +55: [2023-04-29 11:26:50,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +55: [2023-04-29 11:26:50,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +49: [2023-04-29 11:26:50,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +59: [2023-04-29 11:26:50,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +59: [2023-04-29 11:26:50,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +19: [2023-04-29 11:26:50,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +17: [2023-04-29 11:26:50,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +45: [2023-04-29 11:26:50,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +17: [2023-04-29 11:26:50,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... + 7: [2023-04-29 11:26:50,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,652] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +56: [2023-04-29 11:26:50,653] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +24: [2023-04-29 11:26:50,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +24: [2023-04-29 11:26:50,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +24: [2023-04-29 11:26:50,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +24: [2023-04-29 11:26:50,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +55: [2023-04-29 11:26:50,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +55: [2023-04-29 11:26:50,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +25: [2023-04-29 11:26:50,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +17: [2023-04-29 11:26:50,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +59: [2023-04-29 11:26:50,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +59: [2023-04-29 11:26:50,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +46: [2023-04-29 11:26:50,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +46: [2023-04-29 11:26:50,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +19: [2023-04-29 11:26:50,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... + 7: [2023-04-29 11:26:50,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +59: [2023-04-29 11:26:50,656] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +19: [2023-04-29 11:26:50,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +45: [2023-04-29 11:26:50,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +55: [2023-04-29 11:26:50,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +56: [2023-04-29 11:26:50,657] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +25: [2023-04-29 11:26:50,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +49: [2023-04-29 11:26:50,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +49: [2023-04-29 11:26:50,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +49: [2023-04-29 11:26:50,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +17: [2023-04-29 11:26:50,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +25: [2023-04-29 11:26:50,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +24: [2023-04-29 11:26:50,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +24: [2023-04-29 11:26:50,658] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +46: [2023-04-29 11:26:50,658] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +24: [2023-04-29 11:26:50,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +56: [2023-04-29 11:26:50,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +56: [2023-04-29 11:26:50,659] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +24: [2023-04-29 11:26:50,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +55: [2023-04-29 11:26:50,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +28: [2023-04-29 11:26:50,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +39: [2023-04-29 11:26:50,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +39: [2023-04-29 11:26:50,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +39: [2023-04-29 11:26:50,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +28: [2023-04-29 11:26:50,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +39: [2023-04-29 11:26:50,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +33: [2023-04-29 11:26:50,661] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +46: [2023-04-29 11:26:50,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +17: [2023-04-29 11:26:50,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +17: [2023-04-29 11:26:50,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +46: [2023-04-29 11:26:50,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +19: [2023-04-29 11:26:50,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +46: [2023-04-29 11:26:50,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +19: [2023-04-29 11:26:50,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +56: [2023-04-29 11:26:50,665] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +56: [2023-04-29 11:26:50,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +45: [2023-04-29 11:26:50,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +55: [2023-04-29 11:26:50,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +56: [2023-04-29 11:26:50,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +25: [2023-04-29 11:26:50,667] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +33: [2023-04-29 11:26:50,667] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +49: [2023-04-29 11:26:50,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +46: [2023-04-29 11:26:50,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +17: [2023-04-29 11:26:50,668] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +59: [2023-04-29 11:26:50,668] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +59: [2023-04-29 11:26:50,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +59: [2023-04-29 11:26:50,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +40: [2023-04-29 11:26:50,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +19: [2023-04-29 11:26:50,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +34: [2023-04-29 11:26:50,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +34: [2023-04-29 11:26:50,669] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +45: [2023-04-29 11:26:50,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +32: [2023-04-29 11:26:50,671] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +49: [2023-04-29 11:26:50,672] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 6: [2023-04-29 11:26:50,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +49: [2023-04-29 11:26:50,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 11:26:50,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +55: [2023-04-29 11:26:50,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +40: [2023-04-29 11:26:50,673] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +32: [2023-04-29 11:26:50,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +32: [2023-04-29 11:26:50,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +32: [2023-04-29 11:26:50,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +46: [2023-04-29 11:26:50,673] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +34: [2023-04-29 11:26:50,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +34: [2023-04-29 11:26:50,674] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +37: [2023-04-29 11:26:50,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +37: [2023-04-29 11:26:50,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +37: [2023-04-29 11:26:50,675] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +37: [2023-04-29 11:26:50,676] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. + 6: [2023-04-29 11:26:50,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +48: [2023-04-29 11:26:50,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +48: [2023-04-29 11:26:50,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 6: [2023-04-29 11:26:50,677] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +23: [2023-04-29 11:26:50,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +23: [2023-04-29 11:26:50,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +49: [2023-04-29 11:26:50,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +37: [2023-04-29 11:26:50,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +37: [2023-04-29 11:26:50,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +40: [2023-04-29 11:26:50,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +40: [2023-04-29 11:26:50,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 11:26:50,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 6: [2023-04-29 11:26:50,678] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +37: [2023-04-29 11:26:50,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +37: [2023-04-29 11:26:50,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +49: [2023-04-29 11:26:50,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +59: [2023-04-29 11:26:50,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +25: [2023-04-29 11:26:50,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +23: [2023-04-29 11:26:50,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +23: [2023-04-29 11:26:50,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +33: [2023-04-29 11:26:50,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +33: [2023-04-29 11:26:50,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +51: [2023-04-29 11:26:50,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +51: [2023-04-29 11:26:50,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +29: [2023-04-29 11:26:50,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +29: [2023-04-29 11:26:50,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +29: [2023-04-29 11:26:50,682] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +23: [2023-04-29 11:26:50,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +23: [2023-04-29 11:26:50,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +37: [2023-04-29 11:26:50,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +51: [2023-04-29 11:26:50,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +29: [2023-04-29 11:26:50,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +21: [2023-04-29 11:26:50,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +21: [2023-04-29 11:26:50,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +21: [2023-04-29 11:26:50,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +51: [2023-04-29 11:26:50,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +21: [2023-04-29 11:26:50,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +37: [2023-04-29 11:26:50,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +59: [2023-04-29 11:26:50,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +23: [2023-04-29 11:26:50,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +23: [2023-04-29 11:26:50,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +45: [2023-04-29 11:26:50,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +55: [2023-04-29 11:26:50,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +45: [2023-04-29 11:26:50,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +29: [2023-04-29 11:26:50,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +29: [2023-04-29 11:26:50,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +33: [2023-04-29 11:26:50,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +29: [2023-04-29 11:26:50,688] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +29: [2023-04-29 11:26:50,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +51: [2023-04-29 11:26:50,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +51: [2023-04-29 11:26:50,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +21: [2023-04-29 11:26:50,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +51: [2023-04-29 11:26:50,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +21: [2023-04-29 11:26:50,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +55: [2023-04-29 11:26:50,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +51: [2023-04-29 11:26:50,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +21: [2023-04-29 11:26:50,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +37: [2023-04-29 11:26:50,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +37: [2023-04-29 11:26:50,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +21: [2023-04-29 11:26:50,690] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +39: [2023-04-29 11:26:50,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +33: [2023-04-29 11:26:50,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +59: [2023-04-29 11:26:50,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +62: [2023-04-29 11:26:50,691] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +51: [2023-04-29 11:26:50,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +51: [2023-04-29 11:26:50,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +40: [2023-04-29 11:26:50,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +51: [2023-04-29 11:26:50,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +51: [2023-04-29 11:26:50,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +55: [2023-04-29 11:26:50,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +55: [2023-04-29 11:26:50,693] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +33: [2023-04-29 11:26:50,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +39: [2023-04-29 11:26:50,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +57: [2023-04-29 11:26:50,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +57: [2023-04-29 11:26:50,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +47: [2023-04-29 11:26:50,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +47: [2023-04-29 11:26:50,695] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +47: [2023-04-29 11:26:50,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +47: [2023-04-29 11:26:50,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +39: [2023-04-29 11:26:50,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +33: [2023-04-29 11:26:50,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +55: [2023-04-29 11:26:50,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,697] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +39: [2023-04-29 11:26:50,697] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +57: [2023-04-29 11:26:50,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +57: [2023-04-29 11:26:50,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,698] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +16: [2023-04-29 11:26:50,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +43: [2023-04-29 11:26:50,700] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +47: [2023-04-29 11:26:50,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +34: [2023-04-29 11:26:50,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +34: [2023-04-29 11:26:50,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +57: [2023-04-29 11:26:50,701] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +46: [2023-04-29 11:26:50,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +46: [2023-04-29 11:26:50,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +55: [2023-04-29 11:26:50,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +33: [2023-04-29 11:26:50,702] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +57: [2023-04-29 11:26:50,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +59: [2023-04-29 11:26:50,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +62: [2023-04-29 11:26:50,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +55: [2023-04-29 11:26:50,703] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,703] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +46: [2023-04-29 11:26:50,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +46: [2023-04-29 11:26:50,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +43: [2023-04-29 11:26:50,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +47: [2023-04-29 11:26:50,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +40: [2023-04-29 11:26:50,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +57: [2023-04-29 11:26:50,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +59: [2023-04-29 11:26:50,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +47: [2023-04-29 11:26:50,705] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +47: [2023-04-29 11:26:50,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +57: [2023-04-29 11:26:50,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +33: [2023-04-29 11:26:50,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +59: [2023-04-29 11:26:50,706] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +62: [2023-04-29 11:26:50,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +62: [2023-04-29 11:26:50,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +16: [2023-04-29 11:26:50,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +34: [2023-04-29 11:26:50,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +47: [2023-04-29 11:26:50,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +47: [2023-04-29 11:26:50,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +37: [2023-04-29 11:26:50,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +16: [2023-04-29 11:26:50,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +34: [2023-04-29 11:26:50,711] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +43: [2023-04-29 11:26:50,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +40: [2023-04-29 11:26:50,712] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +40: [2023-04-29 11:26:50,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +37: [2023-04-29 11:26:50,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +37: [2023-04-29 11:26:50,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +43: [2023-04-29 11:26:50,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +53: [2023-04-29 11:26:50,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +53: [2023-04-29 11:26:50,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +16: [2023-04-29 11:26:50,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +53: [2023-04-29 11:26:50,712] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +37: [2023-04-29 11:26:50,713] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +53: [2023-04-29 11:26:50,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +38: [2023-04-29 11:26:50,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +38: [2023-04-29 11:26:50,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +43: [2023-04-29 11:26:50,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +47: [2023-04-29 11:26:50,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +47: [2023-04-29 11:26:50,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +31: [2023-04-29 11:26:50,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +31: [2023-04-29 11:26:50,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +31: [2023-04-29 11:26:50,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +31: [2023-04-29 11:26:50,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +33: [2023-04-29 11:26:50,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +22: [2023-04-29 11:26:50,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +22: [2023-04-29 11:26:50,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +62: [2023-04-29 11:26:50,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +43: [2023-04-29 11:26:50,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +53: [2023-04-29 11:26:50,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +53: [2023-04-29 11:26:50,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +53: [2023-04-29 11:26:50,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +43: [2023-04-29 11:26:50,718] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +38: [2023-04-29 11:26:50,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +38: [2023-04-29 11:26:50,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +22: [2023-04-29 11:26:50,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +24: [2023-04-29 11:26:50,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +24: [2023-04-29 11:26:50,719] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +22: [2023-04-29 11:26:50,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +51: [2023-04-29 11:26:50,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +51: [2023-04-29 11:26:50,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +43: [2023-04-29 11:26:50,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +61: [2023-04-29 11:26:50,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +61: [2023-04-29 11:26:50,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +61: [2023-04-29 11:26:50,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +51: [2023-04-29 11:26:50,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +33: [2023-04-29 11:26:50,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +61: [2023-04-29 11:26:50,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +53: [2023-04-29 11:26:50,721] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +51: [2023-04-29 11:26:50,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +16: [2023-04-29 11:26:50,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +38: [2023-04-29 11:26:50,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +31: [2023-04-29 11:26:50,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +38: [2023-04-29 11:26:50,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +31: [2023-04-29 11:26:50,722] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +38: [2023-04-29 11:26:50,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +31: [2023-04-29 11:26:50,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +31: [2023-04-29 11:26:50,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +34: [2023-04-29 11:26:50,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +24: [2023-04-29 11:26:50,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +38: [2023-04-29 11:26:50,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +22: [2023-04-29 11:26:50,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +24: [2023-04-29 11:26:50,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +22: [2023-04-29 11:26:50,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +33: [2023-04-29 11:26:50,725] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +55: [2023-04-29 11:26:50,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +22: [2023-04-29 11:26:50,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +34: [2023-04-29 11:26:50,726] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +33: [2023-04-29 11:26:50,726] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +13: [2023-04-29 11:26:50,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +13: [2023-04-29 11:26:50,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +41: [2023-04-29 11:26:50,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +41: [2023-04-29 11:26:50,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +13: [2023-04-29 11:26:50,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +13: [2023-04-29 11:26:50,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +22: [2023-04-29 11:26:50,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +46: [2023-04-29 11:26:50,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +62: [2023-04-29 11:26:50,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +46: [2023-04-29 11:26:50,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +52: [2023-04-29 11:26:50,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +52: [2023-04-29 11:26:50,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +41: [2023-04-29 11:26:50,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +41: [2023-04-29 11:26:50,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +13: [2023-04-29 11:26:50,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +13: [2023-04-29 11:26:50,733] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +41: [2023-04-29 11:26:50,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +41: [2023-04-29 11:26:50,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +46: [2023-04-29 11:26:50,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +41: [2023-04-29 11:26:50,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +41: [2023-04-29 11:26:50,734] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +62: [2023-04-29 11:26:50,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +62: [2023-04-29 11:26:50,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +13: [2023-04-29 11:26:50,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +13: [2023-04-29 11:26:50,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +46: [2023-04-29 11:26:50,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +52: [2023-04-29 11:26:50,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +33: [2023-04-29 11:26:50,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... + 6: [2023-04-29 11:26:50,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +60: [2023-04-29 11:26:50,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +60: [2023-04-29 11:26:50,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +41: [2023-04-29 11:26:50,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +41: [2023-04-29 11:26:50,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +60: [2023-04-29 11:26:50,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +60: [2023-04-29 11:26:50,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +52: [2023-04-29 11:26:50,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +52: [2023-04-29 11:26:50,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +44: [2023-04-29 11:26:50,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +44: [2023-04-29 11:26:50,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +52: [2023-04-29 11:26:50,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +41: [2023-04-29 11:26:50,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +15: [2023-04-29 11:26:50,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +15: [2023-04-29 11:26:50,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +33: [2023-04-29 11:26:50,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +15: [2023-04-29 11:26:50,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +16: [2023-04-29 11:26:50,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +15: [2023-04-29 11:26:50,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +48: [2023-04-29 11:26:50,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +41: [2023-04-29 11:26:50,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +47: [2023-04-29 11:26:50,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +47: [2023-04-29 11:26:50,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +44: [2023-04-29 11:26:50,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +44: [2023-04-29 11:26:50,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +52: [2023-04-29 11:26:50,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +20: [2023-04-29 11:26:50,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +20: [2023-04-29 11:26:50,740] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +60: [2023-04-29 11:26:50,741] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +50: [2023-04-29 11:26:50,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +50: [2023-04-29 11:26:50,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +20: [2023-04-29 11:26:50,742] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +29: [2023-04-29 11:26:50,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +20: [2023-04-29 11:26:50,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +52: [2023-04-29 11:26:50,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +23: [2023-04-29 11:26:50,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +23: [2023-04-29 11:26:50,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +15: [2023-04-29 11:26:50,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +60: [2023-04-29 11:26:50,743] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +50: [2023-04-29 11:26:50,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +60: [2023-04-29 11:26:50,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +48: [2023-04-29 11:26:50,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +50: [2023-04-29 11:26:50,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +55: [2023-04-29 11:26:50,744] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +15: [2023-04-29 11:26:50,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +15: [2023-04-29 11:26:50,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +15: [2023-04-29 11:26:50,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +60: [2023-04-29 11:26:50,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +47: [2023-04-29 11:26:50,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +24: [2023-04-29 11:26:50,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +24: [2023-04-29 11:26:50,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +16: [2023-04-29 11:26:50,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +61: [2023-04-29 11:26:50,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +20: [2023-04-29 11:26:50,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +20: [2023-04-29 11:26:50,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +20: [2023-04-29 11:26:50,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +16: [2023-04-29 11:26:50,747] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +50: [2023-04-29 11:26:50,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +48: [2023-04-29 11:26:50,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 11:26:50,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +20: [2023-04-29 11:26:50,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +61: [2023-04-29 11:26:50,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +34: [2023-04-29 11:26:50,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +34: [2023-04-29 11:26:50,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +46: [2023-04-29 11:26:50,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +46: [2023-04-29 11:26:50,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +11: [2023-04-29 11:26:50,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +11: [2023-04-29 11:26:50,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +48: [2023-04-29 11:26:50,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +47: [2023-04-29 11:26:50,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +11: [2023-04-29 11:26:50,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +39: [2023-04-29 11:26:50,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +11: [2023-04-29 11:26:50,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +50: [2023-04-29 11:26:50,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +55: [2023-04-29 11:26:50,751] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +37: [2023-04-29 11:26:50,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +23: [2023-04-29 11:26:50,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +24: [2023-04-29 11:26:50,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +24: [2023-04-29 11:26:50,752] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +58: [2023-04-29 11:26:50,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +58: [2023-04-29 11:26:50,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +58: [2023-04-29 11:26:50,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +29: [2023-04-29 11:26:50,753] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +61: [2023-04-29 11:26:50,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +61: [2023-04-29 11:26:50,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +34: [2023-04-29 11:26:50,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +29: [2023-04-29 11:26:50,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +58: [2023-04-29 11:26:50,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +48: [2023-04-29 11:26:50,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +50: [2023-04-29 11:26:50,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +39: [2023-04-29 11:26:50,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +17: [2023-04-29 11:26:50,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +17: [2023-04-29 11:26:50,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +46: [2023-04-29 11:26:50,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +46: [2023-04-29 11:26:50,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 11:26:50,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +17: [2023-04-29 11:26:50,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +50: [2023-04-29 11:26:50,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +50: [2023-04-29 11:26:50,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +50: [2023-04-29 11:26:50,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +11: [2023-04-29 11:26:50,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +17: [2023-04-29 11:26:50,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +48: [2023-04-29 11:26:50,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +34: [2023-04-29 11:26:50,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +61: [2023-04-29 11:26:50,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +61: [2023-04-29 11:26:50,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +50: [2023-04-29 11:26:50,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +50: [2023-04-29 11:26:50,757] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +11: [2023-04-29 11:26:50,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +58: [2023-04-29 11:26:50,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +45: [2023-04-29 11:26:50,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. + 2: [2023-04-29 11:26:50,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +11: [2023-04-29 11:26:50,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +45: [2023-04-29 11:26:50,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +45: [2023-04-29 11:26:50,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +58: [2023-04-29 11:26:50,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +45: [2023-04-29 11:26:50,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. + 2: [2023-04-29 11:26:50,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +58: [2023-04-29 11:26:50,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +11: [2023-04-29 11:26:50,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 11:26:50,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +21: [2023-04-29 11:26:50,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +21: [2023-04-29 11:26:50,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +61: [2023-04-29 11:26:50,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +61: [2023-04-29 11:26:50,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +29: [2023-04-29 11:26:50,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +58: [2023-04-29 11:26:50,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +12: [2023-04-29 11:26:50,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +12: [2023-04-29 11:26:50,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +12: [2023-04-29 11:26:50,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +17: [2023-04-29 11:26:50,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +17: [2023-04-29 11:26:50,761] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +12: [2023-04-29 11:26:50,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +39: [2023-04-29 11:26:50,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +39: [2023-04-29 11:26:50,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +61: [2023-04-29 11:26:50,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +21: [2023-04-29 11:26:50,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +61: [2023-04-29 11:26:50,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 2: [2023-04-29 11:26:50,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +57: [2023-04-29 11:26:50,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +17: [2023-04-29 11:26:50,763] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +17: [2023-04-29 11:26:50,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +51: [2023-04-29 11:26:50,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 2: [2023-04-29 11:26:50,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +37: [2023-04-29 11:26:50,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +12: [2023-04-29 11:26:50,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +41: [2023-04-29 11:26:50,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +12: [2023-04-29 11:26:50,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 2: [2023-04-29 11:26:50,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 6: [2023-04-29 11:26:50,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +61: [2023-04-29 11:26:50,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +61: [2023-04-29 11:26:50,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 8: [2023-04-29 11:26:50,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +51: [2023-04-29 11:26:50,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +51: [2023-04-29 11:26:50,767] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +12: [2023-04-29 11:26:50,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +39: [2023-04-29 11:26:50,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... + 8: [2023-04-29 11:26:50,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +39: [2023-04-29 11:26:50,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +12: [2023-04-29 11:26:50,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +42: [2023-04-29 11:26:50,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +42: [2023-04-29 11:26:50,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +44: [2023-04-29 11:26:50,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +42: [2023-04-29 11:26:50,768] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +44: [2023-04-29 11:26:50,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +42: [2023-04-29 11:26:50,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +41: [2023-04-29 11:26:50,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +41: [2023-04-29 11:26:50,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +44: [2023-04-29 11:26:50,769] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +51: [2023-04-29 11:26:50,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +41: [2023-04-29 11:26:50,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +23: [2023-04-29 11:26:50,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +57: [2023-04-29 11:26:50,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +57: [2023-04-29 11:26:50,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +57: [2023-04-29 11:26:50,770] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +57: [2023-04-29 11:26:50,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +44: [2023-04-29 11:26:50,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +29: [2023-04-29 11:26:50,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +39: [2023-04-29 11:26:50,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,773] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +23: [2023-04-29 11:26:50,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +23: [2023-04-29 11:26:50,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +57: [2023-04-29 11:26:50,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +46: [2023-04-29 11:26:50,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 8: [2023-04-29 11:26:50,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +30: [2023-04-29 11:26:50,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +30: [2023-04-29 11:26:50,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +10: [2023-04-29 11:26:50,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +10: [2023-04-29 11:26:50,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +30: [2023-04-29 11:26:50,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 8: [2023-04-29 11:26:50,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +57: [2023-04-29 11:26:50,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +30: [2023-04-29 11:26:50,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +47: [2023-04-29 11:26:50,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +38: [2023-04-29 11:26:50,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +55: [2023-04-29 11:26:50,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +11: [2023-04-29 11:26:50,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +11: [2023-04-29 11:26:50,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +55: [2023-04-29 11:26:50,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +10: [2023-04-29 11:26:50,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +11: [2023-04-29 11:26:50,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +46: [2023-04-29 11:26:50,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +11: [2023-04-29 11:26:50,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +10: [2023-04-29 11:26:50,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +39: [2023-04-29 11:26:50,778] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +19: [2023-04-29 11:26:50,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +19: [2023-04-29 11:26:50,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +19: [2023-04-29 11:26:50,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +19: [2023-04-29 11:26:50,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +10: [2023-04-29 11:26:50,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +29: [2023-04-29 11:26:50,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +29: [2023-04-29 11:26:50,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +10: [2023-04-29 11:26:50,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +37: [2023-04-29 11:26:50,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +34: [2023-04-29 11:26:50,780] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +34: [2023-04-29 11:26:50,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +54: [2023-04-29 11:26:50,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +54: [2023-04-29 11:26:50,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +34: [2023-04-29 11:26:50,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +34: [2023-04-29 11:26:50,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +54: [2023-04-29 11:26:50,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +50: [2023-04-29 11:26:50,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 6: [2023-04-29 11:26:50,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +23: [2023-04-29 11:26:50,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +50: [2023-04-29 11:26:50,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +57: [2023-04-29 11:26:50,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +10: [2023-04-29 11:26:50,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +50: [2023-04-29 11:26:50,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +50: [2023-04-29 11:26:50,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +19: [2023-04-29 11:26:50,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +42: [2023-04-29 11:26:50,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +42: [2023-04-29 11:26:50,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +19: [2023-04-29 11:26:50,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +19: [2023-04-29 11:26:50,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +10: [2023-04-29 11:26:50,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +19: [2023-04-29 11:26:50,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +55: [2023-04-29 11:26:50,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +54: [2023-04-29 11:26:50,785] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +47: [2023-04-29 11:26:50,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +47: [2023-04-29 11:26:50,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +47: [2023-04-29 11:26:50,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +55: [2023-04-29 11:26:50,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +45: [2023-04-29 11:26:50,786] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +45: [2023-04-29 11:26:50,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +46: [2023-04-29 11:26:50,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +54: [2023-04-29 11:26:50,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +46: [2023-04-29 11:26:50,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 6: [2023-04-29 11:26:50,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 5: [2023-04-29 11:26:50,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +54: [2023-04-29 11:26:50,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +54: [2023-04-29 11:26:50,787] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +55: [2023-04-29 11:26:50,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +31: [2023-04-29 11:26:50,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +21: [2023-04-29 11:26:50,788] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +34: [2023-04-29 11:26:50,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +34: [2023-04-29 11:26:50,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +21: [2023-04-29 11:26:50,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +21: [2023-04-29 11:26:50,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +53: [2023-04-29 11:26:50,788] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +37: [2023-04-29 11:26:50,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +22: [2023-04-29 11:26:50,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +29: [2023-04-29 11:26:50,789] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 5: [2023-04-29 11:26:50,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +51: [2023-04-29 11:26:50,789] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +40: [2023-04-29 11:26:50,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +40: [2023-04-29 11:26:50,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +40: [2023-04-29 11:26:50,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +40: [2023-04-29 11:26:50,790] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +45: [2023-04-29 11:26:50,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +21: [2023-04-29 11:26:50,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +38: [2023-04-29 11:26:50,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +38: [2023-04-29 11:26:50,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +52: [2023-04-29 11:26:50,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +52: [2023-04-29 11:26:50,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +42: [2023-04-29 11:26:50,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +38: [2023-04-29 11:26:50,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +45: [2023-04-29 11:26:50,791] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +26: [2023-04-29 11:26:50,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +26: [2023-04-29 11:26:50,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +51: [2023-04-29 11:26:50,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +53: [2023-04-29 11:26:50,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +53: [2023-04-29 11:26:50,791] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +37: [2023-04-29 11:26:50,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +42: [2023-04-29 11:26:50,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +31: [2023-04-29 11:26:50,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +31: [2023-04-29 11:26:50,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +31: [2023-04-29 11:26:50,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +53: [2023-04-29 11:26:50,793] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +42: [2023-04-29 11:26:50,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +37: [2023-04-29 11:26:50,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +57: [2023-04-29 11:26:50,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 5: [2023-04-29 11:26:50,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +26: [2023-04-29 11:26:50,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +26: [2023-04-29 11:26:50,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +42: [2023-04-29 11:26:50,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +22: [2023-04-29 11:26:50,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +22: [2023-04-29 11:26:50,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +54: [2023-04-29 11:26:50,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +55: [2023-04-29 11:26:50,795] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... + 9: [2023-04-29 11:26:50,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 9: [2023-04-29 11:26:50,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +52: [2023-04-29 11:26:50,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +52: [2023-04-29 11:26:50,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +51: [2023-04-29 11:26:50,796] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +37: [2023-04-29 11:26:50,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +51: [2023-04-29 11:26:50,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +62: [2023-04-29 11:26:50,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +62: [2023-04-29 11:26:50,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. + 9: [2023-04-29 11:26:50,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +51: [2023-04-29 11:26:50,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... + 9: [2023-04-29 11:26:50,797] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +51: [2023-04-29 11:26:50,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +51: [2023-04-29 11:26:50,797] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 5: [2023-04-29 11:26:50,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +37: [2023-04-29 11:26:50,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +26: [2023-04-29 11:26:50,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +26: [2023-04-29 11:26:50,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +23: [2023-04-29 11:26:50,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +56: [2023-04-29 11:26:50,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +56: [2023-04-29 11:26:50,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +42: [2023-04-29 11:26:50,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +51: [2023-04-29 11:26:50,799] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +56: [2023-04-29 11:26:50,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +42: [2023-04-29 11:26:50,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +47: [2023-04-29 11:26:50,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +26: [2023-04-29 11:26:50,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +42: [2023-04-29 11:26:50,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +56: [2023-04-29 11:26:50,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +26: [2023-04-29 11:26:50,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +57: [2023-04-29 11:26:50,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +62: [2023-04-29 11:26:50,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +62: [2023-04-29 11:26:50,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +51: [2023-04-29 11:26:50,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +14: [2023-04-29 11:26:50,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +14: [2023-04-29 11:26:50,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +57: [2023-04-29 11:26:50,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +42: [2023-04-29 11:26:50,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +42: [2023-04-29 11:26:50,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +57: [2023-04-29 11:26:50,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +42: [2023-04-29 11:26:50,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,801] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +34: [2023-04-29 11:26:50,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 9: [2023-04-29 11:26:50,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +60: [2023-04-29 11:26:50,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +46: [2023-04-29 11:26:50,802] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +37: [2023-04-29 11:26:50,802] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +14: [2023-04-29 11:26:50,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +51: [2023-04-29 11:26:50,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +14: [2023-04-29 11:26:50,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +30: [2023-04-29 11:26:50,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +13: [2023-04-29 11:26:50,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +30: [2023-04-29 11:26:50,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +13: [2023-04-29 11:26:50,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +11: [2023-04-29 11:26:50,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +57: [2023-04-29 11:26:50,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +13: [2023-04-29 11:26:50,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +14: [2023-04-29 11:26:50,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +34: [2023-04-29 11:26:50,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +56: [2023-04-29 11:26:50,804] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +56: [2023-04-29 11:26:50,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +56: [2023-04-29 11:26:50,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +56: [2023-04-29 11:26:50,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +44: [2023-04-29 11:26:50,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +44: [2023-04-29 11:26:50,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +44: [2023-04-29 11:26:50,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +30: [2023-04-29 11:26:50,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +44: [2023-04-29 11:26:50,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +30: [2023-04-29 11:26:50,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +38: [2023-04-29 11:26:50,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +37: [2023-04-29 11:26:50,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +37: [2023-04-29 11:26:50,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +15: [2023-04-29 11:26:50,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +51: [2023-04-29 11:26:50,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +14: [2023-04-29 11:26:50,808] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +22: [2023-04-29 11:26:50,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +46: [2023-04-29 11:26:50,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +57: [2023-04-29 11:26:50,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +15: [2023-04-29 11:26:50,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +47: [2023-04-29 11:26:50,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +52: [2023-04-29 11:26:50,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +14: [2023-04-29 11:26:50,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +57: [2023-04-29 11:26:50,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +46: [2023-04-29 11:26:50,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +51: [2023-04-29 11:26:50,809] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +41: [2023-04-29 11:26:50,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +41: [2023-04-29 11:26:50,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +34: [2023-04-29 11:26:50,810] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +13: [2023-04-29 11:26:50,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +14: [2023-04-29 11:26:50,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +47: [2023-04-29 11:26:50,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +15: [2023-04-29 11:26:50,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +15: [2023-04-29 11:26:50,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +44: [2023-04-29 11:26:50,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +61: [2023-04-29 11:26:50,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +44: [2023-04-29 11:26:50,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +46: [2023-04-29 11:26:50,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +20: [2023-04-29 11:26:50,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 1: [2023-04-29 11:26:50,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 1: [2023-04-29 11:26:50,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +44: [2023-04-29 11:26:50,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +38: [2023-04-29 11:26:50,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +38: [2023-04-29 11:26:50,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. + 1: [2023-04-29 11:26:50,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +37: [2023-04-29 11:26:50,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +38: [2023-04-29 11:26:50,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +44: [2023-04-29 11:26:50,815] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +52: [2023-04-29 11:26:50,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +34: [2023-04-29 11:26:50,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +47: [2023-04-29 11:26:50,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +50: [2023-04-29 11:26:50,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +11: [2023-04-29 11:26:50,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +38: [2023-04-29 11:26:50,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +38: [2023-04-29 11:26:50,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +60: [2023-04-29 11:26:50,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +60: [2023-04-29 11:26:50,816] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +11: [2023-04-29 11:26:50,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +11: [2023-04-29 11:26:50,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +22: [2023-04-29 11:26:50,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +20: [2023-04-29 11:26:50,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +20: [2023-04-29 11:26:50,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +20: [2023-04-29 11:26:50,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +47: [2023-04-29 11:26:50,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +37: [2023-04-29 11:26:50,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +61: [2023-04-29 11:26:50,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +52: [2023-04-29 11:26:50,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +41: [2023-04-29 11:26:50,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +31: [2023-04-29 11:26:50,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +40: [2023-04-29 11:26:50,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +57: [2023-04-29 11:26:50,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +47: [2023-04-29 11:26:50,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +60: [2023-04-29 11:26:50,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +40: [2023-04-29 11:26:50,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +41: [2023-04-29 11:26:50,819] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +46: [2023-04-29 11:26:50,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +46: [2023-04-29 11:26:50,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +52: [2023-04-29 11:26:50,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +40: [2023-04-29 11:26:50,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +40: [2023-04-29 11:26:50,820] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +61: [2023-04-29 11:26:50,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +37: [2023-04-29 11:26:50,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +53: [2023-04-29 11:26:50,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +47: [2023-04-29 11:26:50,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +47: [2023-04-29 11:26:50,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +38: [2023-04-29 11:26:50,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +38: [2023-04-29 11:26:50,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +31: [2023-04-29 11:26:50,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +31: [2023-04-29 11:26:50,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +31: [2023-04-29 11:26:50,823] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +37: [2023-04-29 11:26:50,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +11: [2023-04-29 11:26:50,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +37: [2023-04-29 11:26:50,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +53: [2023-04-29 11:26:50,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +53: [2023-04-29 11:26:50,824] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +53: [2023-04-29 11:26:50,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +52: [2023-04-29 11:26:50,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +58: [2023-04-29 11:26:50,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +52: [2023-04-29 11:26:50,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +47: [2023-04-29 11:26:50,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +22: [2023-04-29 11:26:50,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +22: [2023-04-29 11:26:50,825] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +60: [2023-04-29 11:26:50,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +62: [2023-04-29 11:26:50,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 2: [2023-04-29 11:26:50,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 11:26:50,826] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +46: [2023-04-29 11:26:50,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +62: [2023-04-29 11:26:50,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +46: [2023-04-29 11:26:50,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +61: [2023-04-29 11:26:50,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +47: [2023-04-29 11:26:50,826] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +52: [2023-04-29 11:26:50,827] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +62: [2023-04-29 11:26:50,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +52: [2023-04-29 11:26:50,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +17: [2023-04-29 11:26:50,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +58: [2023-04-29 11:26:50,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +36: [2023-04-29 11:26:50,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +36: [2023-04-29 11:26:50,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +36: [2023-04-29 11:26:50,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +62: [2023-04-29 11:26:50,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +36: [2023-04-29 11:26:50,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +61: [2023-04-29 11:26:50,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +61: [2023-04-29 11:26:50,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +58: [2023-04-29 11:26:50,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +17: [2023-04-29 11:26:50,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +17: [2023-04-29 11:26:50,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +58: [2023-04-29 11:26:50,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +61: [2023-04-29 11:26:50,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +61: [2023-04-29 11:26:50,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +12: [2023-04-29 11:26:50,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +12: [2023-04-29 11:26:50,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +35: [2023-04-29 11:26:50,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +35: [2023-04-29 11:26:50,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +13: [2023-04-29 11:26:50,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +13: [2023-04-29 11:26:50,835] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +50: [2023-04-29 11:26:50,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +50: [2023-04-29 11:26:50,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +36: [2023-04-29 11:26:50,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 2: [2023-04-29 11:26:50,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +41: [2023-04-29 11:26:50,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +15: [2023-04-29 11:26:50,837] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +44: [2023-04-29 11:26:50,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +12: [2023-04-29 11:26:50,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +12: [2023-04-29 11:26:50,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +20: [2023-04-29 11:26:50,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +13: [2023-04-29 11:26:50,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +41: [2023-04-29 11:26:50,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +36: [2023-04-29 11:26:50,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +41: [2023-04-29 11:26:50,838] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +36: [2023-04-29 11:26:50,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +63: [2023-04-29 11:26:50,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +63: [2023-04-29 11:26:50,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +63: [2023-04-29 11:26:50,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +36: [2023-04-29 11:26:50,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 2: [2023-04-29 11:26:50,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 1: [2023-04-29 11:26:50,839] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +63: [2023-04-29 11:26:50,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +50: [2023-04-29 11:26:50,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +44: [2023-04-29 11:26:50,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +44: [2023-04-29 11:26:50,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +35: [2023-04-29 11:26:50,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +47: [2023-04-29 11:26:50,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +35: [2023-04-29 11:26:50,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. + 1: [2023-04-29 11:26:50,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +44: [2023-04-29 11:26:50,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +13: [2023-04-29 11:26:50,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +52: [2023-04-29 11:26:50,841] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +61: [2023-04-29 11:26:50,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +61: [2023-04-29 11:26:50,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +35: [2023-04-29 11:26:50,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +35: [2023-04-29 11:26:50,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +35: [2023-04-29 11:26:50,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +20: [2023-04-29 11:26:50,842] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +10: [2023-04-29 11:26:50,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +35: [2023-04-29 11:26:50,842] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +44: [2023-04-29 11:26:50,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +54: [2023-04-29 11:26:50,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +54: [2023-04-29 11:26:50,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. + 1: [2023-04-29 11:26:50,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +41: [2023-04-29 11:26:50,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +15: [2023-04-29 11:26:50,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +63: [2023-04-29 11:26:50,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +52: [2023-04-29 11:26:50,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +19: [2023-04-29 11:26:50,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +22: [2023-04-29 11:26:50,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +15: [2023-04-29 11:26:50,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +15: [2023-04-29 11:26:50,844] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +61: [2023-04-29 11:26:50,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +38: [2023-04-29 11:26:50,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +38: [2023-04-29 11:26:50,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +41: [2023-04-29 11:26:50,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +61: [2023-04-29 11:26:50,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +63: [2023-04-29 11:26:50,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +63: [2023-04-29 11:26:50,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +63: [2023-04-29 11:26:50,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +41: [2023-04-29 11:26:50,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +54: [2023-04-29 11:26:50,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +44: [2023-04-29 11:26:50,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +54: [2023-04-29 11:26:50,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +44: [2023-04-29 11:26:50,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +47: [2023-04-29 11:26:50,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +10: [2023-04-29 11:26:50,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +44: [2023-04-29 11:26:50,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +52: [2023-04-29 11:26:50,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +20: [2023-04-29 11:26:50,847] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +38: [2023-04-29 11:26:50,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +38: [2023-04-29 11:26:50,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +20: [2023-04-29 11:26:50,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +60: [2023-04-29 11:26:50,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +50: [2023-04-29 11:26:50,847] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +35: [2023-04-29 11:26:50,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +60: [2023-04-29 11:26:50,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +35: [2023-04-29 11:26:50,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +50: [2023-04-29 11:26:50,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +41: [2023-04-29 11:26:50,850] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +19: [2023-04-29 11:26:50,850] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +41: [2023-04-29 11:26:50,851] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +15: [2023-04-29 11:26:50,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +15: [2023-04-29 11:26:50,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +15: [2023-04-29 11:26:50,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +35: [2023-04-29 11:26:50,852] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +15: [2023-04-29 11:26:50,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +35: [2023-04-29 11:26:50,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +41: [2023-04-29 11:26:50,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +50: [2023-04-29 11:26:50,853] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... + 9: [2023-04-29 11:26:50,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +60: [2023-04-29 11:26:50,854] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +41: [2023-04-29 11:26:50,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +52: [2023-04-29 11:26:50,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +19: [2023-04-29 11:26:50,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +19: [2023-04-29 11:26:50,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +50: [2023-04-29 11:26:50,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +10: [2023-04-29 11:26:50,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +45: [2023-04-29 11:26:50,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +17: [2023-04-29 11:26:50,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +53: [2023-04-29 11:26:50,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +53: [2023-04-29 11:26:50,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +58: [2023-04-29 11:26:50,857] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +54: [2023-04-29 11:26:50,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +53: [2023-04-29 11:26:50,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +53: [2023-04-29 11:26:50,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_41-model_01-model_states.pt. +50: [2023-04-29 11:26:50,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +50: [2023-04-29 11:26:50,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 6: [2023-04-29 11:26:50,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 6: [2023-04-29 11:26:50,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +17: [2023-04-29 11:26:50,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +54: [2023-04-29 11:26:50,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +54: [2023-04-29 11:26:50,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +41: [2023-04-29 11:26:50,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +48: [2023-04-29 11:26:50,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +48: [2023-04-29 11:26:50,859] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +50: [2023-04-29 11:26:50,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... + 5: [2023-04-29 11:26:50,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +61: [2023-04-29 11:26:50,860] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 6: [2023-04-29 11:26:50,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +41: [2023-04-29 11:26:50,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +61: [2023-04-29 11:26:50,861] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +48: [2023-04-29 11:26:50,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +48: [2023-04-29 11:26:50,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +45: [2023-04-29 11:26:50,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +11: [2023-04-29 11:26:50,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +11: [2023-04-29 11:26:50,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +45: [2023-04-29 11:26:50,862] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +10: [2023-04-29 11:26:50,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +49: [2023-04-29 11:26:50,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +49: [2023-04-29 11:26:50,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +48: [2023-04-29 11:26:50,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +50: [2023-04-29 11:26:50,864] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +50: [2023-04-29 11:26:50,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +45: [2023-04-29 11:26:50,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +57: [2023-04-29 11:26:50,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 11:26:50,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 8: [2023-04-29 11:26:50,865] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +11: [2023-04-29 11:26:50,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +14: [2023-04-29 11:26:50,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 0: [2023-04-29 11:26:50,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 0: [2023-04-29 11:26:50,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 7: [2023-04-29 11:26:50,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +45: [2023-04-29 11:26:50,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 11:26:50,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +58: [2023-04-29 11:26:50,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +26: [2023-04-29 11:26:50,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +26: [2023-04-29 11:26:50,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +12: [2023-04-29 11:26:50,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +45: [2023-04-29 11:26:50,867] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... + 9: [2023-04-29 11:26:50,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +49: [2023-04-29 11:26:50,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +56: [2023-04-29 11:26:50,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +42: [2023-04-29 11:26:50,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +49: [2023-04-29 11:26:50,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +49: [2023-04-29 11:26:50,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +17: [2023-04-29 11:26:50,868] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +12: [2023-04-29 11:26:50,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +12: [2023-04-29 11:26:50,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +50: [2023-04-29 11:26:50,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +48: [2023-04-29 11:26:50,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +17: [2023-04-29 11:26:50,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +11: [2023-04-29 11:26:50,869] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +26: [2023-04-29 11:26:50,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +30: [2023-04-29 11:26:50,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +58: [2023-04-29 11:26:50,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 5: [2023-04-29 11:26:50,869] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +12: [2023-04-29 11:26:50,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +54: [2023-04-29 11:26:50,870] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +58: [2023-04-29 11:26:50,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +49: [2023-04-29 11:26:50,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +50: [2023-04-29 11:26:50,870] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +35: [2023-04-29 11:26:50,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +35: [2023-04-29 11:26:50,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +35: [2023-04-29 11:26:50,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +35: [2023-04-29 11:26:50,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +57: [2023-04-29 11:26:50,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +57: [2023-04-29 11:26:50,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +57: [2023-04-29 11:26:50,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +26: [2023-04-29 11:26:50,871] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 9: [2023-04-29 11:26:50,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +14: [2023-04-29 11:26:50,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +11: [2023-04-29 11:26:50,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 8: [2023-04-29 11:26:50,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +42: [2023-04-29 11:26:50,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +45: [2023-04-29 11:26:50,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... + 0: [2023-04-29 11:26:50,901] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +61: [2023-04-29 11:26:50,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +53: [2023-04-29 11:26:50,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +63: [2023-04-29 11:26:50,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +57: [2023-04-29 11:26:50,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +59: [2023-04-29 11:26:50,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +59: [2023-04-29 11:26:50,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +59: [2023-04-29 11:26:50,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +10: [2023-04-29 11:26:50,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 8: [2023-04-29 11:26:50,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +18: [2023-04-29 11:26:50,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +18: [2023-04-29 11:26:50,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +25: [2023-04-29 11:26:50,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +25: [2023-04-29 11:26:50,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +15: [2023-04-29 11:26:50,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +12: [2023-04-29 11:26:50,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +12: [2023-04-29 11:26:50,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +38: [2023-04-29 11:26:50,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +38: [2023-04-29 11:26:50,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +54: [2023-04-29 11:26:50,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +42: [2023-04-29 11:26:50,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... + 2: [2023-04-29 11:26:50,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt... + 2: [2023-04-29 11:26:50,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt... + 2: [2023-04-29 11:26:50,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt... +39: [2023-04-29 11:26:50,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +39: [2023-04-29 11:26:50,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,882] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +49: [2023-04-29 11:26:50,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +56: [2023-04-29 11:26:50,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +44: [2023-04-29 11:26:50,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +14: [2023-04-29 11:26:50,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 4: [2023-04-29 11:26:50,907] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +36: [2023-04-29 11:26:50,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +40: [2023-04-29 11:26:50,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +30: [2023-04-29 11:26:50,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 9: [2023-04-29 11:26:50,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +52: [2023-04-29 11:26:50,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +43: [2023-04-29 11:26:50,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +43: [2023-04-29 11:26:50,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +11: [2023-04-29 11:26:50,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt... +45: [2023-04-29 11:26:50,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +50: [2023-04-29 11:26:50,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +62: [2023-04-29 11:26:50,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +62: [2023-04-29 11:26:50,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +26: [2023-04-29 11:26:50,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +23: [2023-04-29 11:26:50,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +23: [2023-04-29 11:26:50,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 0: [2023-04-29 11:26:50,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +61: [2023-04-29 11:26:50,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +63: [2023-04-29 11:26:50,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +63: [2023-04-29 11:26:50,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +63: [2023-04-29 11:26:50,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +57: [2023-04-29 11:26:50,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +59: [2023-04-29 11:26:50,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +10: [2023-04-29 11:26:50,895] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 8: [2023-04-29 11:26:50,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +18: [2023-04-29 11:26:50,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +25: [2023-04-29 11:26:50,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +15: [2023-04-29 11:26:50,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +12: [2023-04-29 11:26:50,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +38: [2023-04-29 11:26:50,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +54: [2023-04-29 11:26:50,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +42: [2023-04-29 11:26:50,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 2: [2023-04-29 11:26:50,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt... +39: [2023-04-29 11:26:50,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +49: [2023-04-29 11:26:50,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +56: [2023-04-29 11:26:50,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +56: [2023-04-29 11:26:50,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +44: [2023-04-29 11:26:50,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +14: [2023-04-29 11:26:50,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +30: [2023-04-29 11:26:50,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... + 9: [2023-04-29 11:26:50,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +43: [2023-04-29 11:26:50,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +23: [2023-04-29 11:26:50,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 0: [2023-04-29 11:26:50,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +63: [2023-04-29 11:26:50,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +57: [2023-04-29 11:26:50,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +59: [2023-04-29 11:26:50,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +10: [2023-04-29 11:26:50,896] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 8: [2023-04-29 11:26:50,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +18: [2023-04-29 11:26:50,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +25: [2023-04-29 11:26:50,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +15: [2023-04-29 11:26:50,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +15: [2023-04-29 11:26:50,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +12: [2023-04-29 11:26:50,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +54: [2023-04-29 11:26:50,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +42: [2023-04-29 11:26:50,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +39: [2023-04-29 11:26:50,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,883] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 11:26:50,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +56: [2023-04-29 11:26:50,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +44: [2023-04-29 11:26:50,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +14: [2023-04-29 11:26:50,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,913] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +36: [2023-04-29 11:26:50,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +36: [2023-04-29 11:26:50,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +30: [2023-04-29 11:26:50,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +30: [2023-04-29 11:26:50,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 9: [2023-04-29 11:26:50,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +52: [2023-04-29 11:26:50,900] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +43: [2023-04-29 11:26:50,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +11: [2023-04-29 11:26:50,912] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt... + 6: [2023-04-29 11:26:50,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +26: [2023-04-29 11:26:50,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +23: [2023-04-29 11:26:50,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +63: [2023-04-29 11:26:50,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +57: [2023-04-29 11:26:50,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +59: [2023-04-29 11:26:50,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +10: [2023-04-29 11:26:50,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 8: [2023-04-29 11:26:50,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +38: [2023-04-29 11:26:50,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +38: [2023-04-29 11:26:50,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +54: [2023-04-29 11:26:50,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +42: [2023-04-29 11:26:50,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +39: [2023-04-29 11:26:50,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 5: [2023-04-29 11:26:50,900] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... + 1: [2023-04-29 11:26:50,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +56: [2023-04-29 11:26:50,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +44: [2023-04-29 11:26:50,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +14: [2023-04-29 11:26:50,898] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +36: [2023-04-29 11:26:50,914] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +30: [2023-04-29 11:26:50,880] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... + 9: [2023-04-29 11:26:50,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +52: [2023-04-29 11:26:50,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +43: [2023-04-29 11:26:50,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +43: [2023-04-29 11:26:50,881] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +11: [2023-04-29 11:26:50,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt... + 6: [2023-04-29 11:26:50,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +26: [2023-04-29 11:26:50,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +63: [2023-04-29 11:26:50,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +59: [2023-04-29 11:26:50,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +10: [2023-04-29 11:26:50,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt... +10: [2023-04-29 11:26:50,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt... + 8: [2023-04-29 11:26:50,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +54: [2023-04-29 11:26:50,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +42: [2023-04-29 11:26:50,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +39: [2023-04-29 11:26:50,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,888] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +56: [2023-04-29 11:26:50,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +44: [2023-04-29 11:26:50,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +14: [2023-04-29 11:26:50,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +30: [2023-04-29 11:26:50,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +52: [2023-04-29 11:26:50,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +43: [2023-04-29 11:26:50,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +11: [2023-04-29 11:26:50,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +26: [2023-04-29 11:26:50,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +63: [2023-04-29 11:26:50,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +59: [2023-04-29 11:26:50,899] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 8: [2023-04-29 11:26:50,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +54: [2023-04-29 11:26:50,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +42: [2023-04-29 11:26:50,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +39: [2023-04-29 11:26:50,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +56: [2023-04-29 11:26:50,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +44: [2023-04-29 11:26:50,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +30: [2023-04-29 11:26:50,882] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +52: [2023-04-29 11:26:50,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +43: [2023-04-29 11:26:50,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +11: [2023-04-29 11:26:50,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt... +10: [2023-04-29 11:26:50,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt... + 8: [2023-04-29 11:26:50,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +54: [2023-04-29 11:26:50,895] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +42: [2023-04-29 11:26:50,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +39: [2023-04-29 11:26:50,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 1: [2023-04-29 11:26:50,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +52: [2023-04-29 11:26:50,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +10: [2023-04-29 11:26:50,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt... +54: [2023-04-29 11:26:50,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +42: [2023-04-29 11:26:50,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +44: [2023-04-29 11:26:50,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +40: [2023-04-29 11:26:50,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +40: [2023-04-29 11:26:50,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +40: [2023-04-29 11:26:50,893] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +52: [2023-04-29 11:26:50,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +53: [2023-04-29 11:26:50,887] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +10: [2023-04-29 11:26:50,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +42: [2023-04-29 11:26:50,884] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +44: [2023-04-29 11:26:50,921] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +40: [2023-04-29 11:26:50,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +52: [2023-04-29 11:26:50,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +53: [2023-04-29 11:26:50,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +53: [2023-04-29 11:26:50,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt... +42: [2023-04-29 11:26:50,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +40: [2023-04-29 11:26:50,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +40: [2023-04-29 11:26:50,905] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +62: [2023-04-29 11:26:50,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +42: [2023-04-29 11:26:50,903] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +40: [2023-04-29 11:26:50,907] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +62: [2023-04-29 11:26:50,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +42: [2023-04-29 11:26:50,908] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +62: [2023-04-29 11:26:50,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +62: [2023-04-29 11:26:50,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +62: [2023-04-29 11:26:50,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +42: [2023-04-29 11:26:50,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +62: [2023-04-29 11:26:50,909] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +48: [2023-04-29 11:26:50,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +42: [2023-04-29 11:26:50,917] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +32: [2023-04-29 11:26:50,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +32: [2023-04-29 11:26:50,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +32: [2023-04-29 11:26:50,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +32: [2023-04-29 11:26:50,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +35: [2023-04-29 11:26:50,921] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +27: [2023-04-29 11:26:50,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +27: [2023-04-29 11:26:50,922] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +27: [2023-04-29 11:26:50,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +38: [2023-04-29 11:26:50,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +27: [2023-04-29 11:26:50,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +36: [2023-04-29 11:26:50,924] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +48: [2023-04-29 11:26:50,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +14: [2023-04-29 11:26:50,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +14: [2023-04-29 11:26:50,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +14: [2023-04-29 11:26:50,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +14: [2023-04-29 11:26:50,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +11: [2023-04-29 11:26:50,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... + 0: [2023-04-29 11:26:50,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +38: [2023-04-29 11:26:50,926] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +10: [2023-04-29 11:26:50,927] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +17: [2023-04-29 11:26:50,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +17: [2023-04-29 11:26:50,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 0: [2023-04-29 11:26:50,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +25: [2023-04-29 11:26:50,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +27: [2023-04-29 11:26:50,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +10: [2023-04-29 11:26:50,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +17: [2023-04-29 11:26:50,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +19: [2023-04-29 11:26:50,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt... +19: [2023-04-29 11:26:50,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt... +19: [2023-04-29 11:26:50,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt... +19: [2023-04-29 11:26:50,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt... +18: [2023-04-29 11:26:50,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +27: [2023-04-29 11:26:50,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +17: [2023-04-29 11:26:50,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +27: [2023-04-29 11:26:50,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +27: [2023-04-29 11:26:50,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +32: [2023-04-29 11:26:50,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +18: [2023-04-29 11:26:50,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +38: [2023-04-29 11:26:50,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +25: [2023-04-29 11:26:50,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +32: [2023-04-29 11:26:50,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +14: [2023-04-29 11:26:50,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +32: [2023-04-29 11:26:50,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +32: [2023-04-29 11:26:50,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +11: [2023-04-29 11:26:50,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +35: [2023-04-29 11:26:50,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +49: [2023-04-29 11:26:50,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +12: [2023-04-29 11:26:50,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +25: [2023-04-29 11:26:50,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 0: [2023-04-29 11:26:50,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +18: [2023-04-29 11:26:50,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +18: [2023-04-29 11:26:50,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +25: [2023-04-29 11:26:50,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +10: [2023-04-29 11:26:50,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +23: [2023-04-29 11:26:50,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +23: [2023-04-29 11:26:50,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +63: [2023-04-29 11:26:50,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 9: [2023-04-29 11:26:50,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +12: [2023-04-29 11:26:50,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +12: [2023-04-29 11:26:50,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +12: [2023-04-29 11:26:50,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +23: [2023-04-29 11:26:50,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,936] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +33: [2023-04-29 11:26:50,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 11:26:50,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +33: [2023-04-29 11:26:50,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +33: [2023-04-29 11:26:50,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +11: [2023-04-29 11:26:50,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +48: [2023-04-29 11:26:50,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +35: [2023-04-29 11:26:50,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +35: [2023-04-29 11:26:50,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +45: [2023-04-29 11:26:50,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +45: [2023-04-29 11:26:50,937] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +45: [2023-04-29 11:26:50,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +31: [2023-04-29 11:26:50,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +31: [2023-04-29 11:26:50,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +31: [2023-04-29 11:26:50,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +49: [2023-04-29 11:26:50,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +33: [2023-04-29 11:26:50,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +31: [2023-04-29 11:26:50,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +23: [2023-04-29 11:26:50,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,938] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +63: [2023-04-29 11:26:50,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +11: [2023-04-29 11:26:50,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +40: [2023-04-29 11:26:50,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +40: [2023-04-29 11:26:50,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +40: [2023-04-29 11:26:50,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,939] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +40: [2023-04-29 11:26:50,939] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +33: [2023-04-29 11:26:50,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +45: [2023-04-29 11:26:50,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +63: [2023-04-29 11:26:50,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +45: [2023-04-29 11:26:50,942] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +40: [2023-04-29 11:26:50,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +33: [2023-04-29 11:26:50,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +45: [2023-04-29 11:26:50,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +15: [2023-04-29 11:26:50,943] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +40: [2023-04-29 11:26:50,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +33: [2023-04-29 11:26:50,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +45: [2023-04-29 11:26:50,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +35: [2023-04-29 11:26:50,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +63: [2023-04-29 11:26:50,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +55: [2023-04-29 11:26:50,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +55: [2023-04-29 11:26:50,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +55: [2023-04-29 11:26:50,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +55: [2023-04-29 11:26:50,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +63: [2023-04-29 11:26:50,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 3: [2023-04-29 11:26:50,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +11: [2023-04-29 11:26:50,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +35: [2023-04-29 11:26:50,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +35: [2023-04-29 11:26:50,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 7: [2023-04-29 11:26:50,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +43: [2023-04-29 11:26:50,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +43: [2023-04-29 11:26:50,946] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +33: [2023-04-29 11:26:50,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +40: [2023-04-29 11:26:50,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 7: [2023-04-29 11:26:50,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +40: [2023-04-29 11:26:50,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +36: [2023-04-29 11:26:50,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +48: [2023-04-29 11:26:50,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +63: [2023-04-29 11:26:50,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +15: [2023-04-29 11:26:50,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +49: [2023-04-29 11:26:50,949] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +55: [2023-04-29 11:26:50,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +14: [2023-04-29 11:26:50,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +55: [2023-04-29 11:26:50,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +55: [2023-04-29 11:26:50,950] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 3: [2023-04-29 11:26:50,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +63: [2023-04-29 11:26:50,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +48: [2023-04-29 11:26:50,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +36: [2023-04-29 11:26:50,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +36: [2023-04-29 11:26:50,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +53: [2023-04-29 11:26:50,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +55: [2023-04-29 11:26:50,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +63: [2023-04-29 11:26:50,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +35: [2023-04-29 11:26:50,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +35: [2023-04-29 11:26:50,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +48: [2023-04-29 11:26:50,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +19: [2023-04-29 11:26:50,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +19: [2023-04-29 11:26:50,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +49: [2023-04-29 11:26:50,953] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +19: [2023-04-29 11:26:50,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +14: [2023-04-29 11:26:50,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +43: [2023-04-29 11:26:50,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +43: [2023-04-29 11:26:50,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +14: [2023-04-29 11:26:50,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +15: [2023-04-29 11:26:50,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +34: [2023-04-29 11:26:50,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +34: [2023-04-29 11:26:50,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +19: [2023-04-29 11:26:50,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +17: [2023-04-29 11:26:50,955] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +20: [2023-04-29 11:26:50,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +20: [2023-04-29 11:26:50,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +20: [2023-04-29 11:26:50,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +20: [2023-04-29 11:26:50,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +17: [2023-04-29 11:26:50,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +17: [2023-04-29 11:26:50,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +53: [2023-04-29 11:26:50,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +15: [2023-04-29 11:26:50,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +34: [2023-04-29 11:26:50,956] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +34: [2023-04-29 11:26:50,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +53: [2023-04-29 11:26:50,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... + 6: [2023-04-29 11:26:50,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +35: [2023-04-29 11:26:50,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +17: [2023-04-29 11:26:50,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +29: [2023-04-29 11:26:50,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +29: [2023-04-29 11:26:50,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +15: [2023-04-29 11:26:50,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +63: [2023-04-29 11:26:50,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 11:26:50,942] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +35: [2023-04-29 11:26:50,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +54: [2023-04-29 11:26:50,946] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +54: [2023-04-29 11:26:50,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +63: [2023-04-29 11:26:50,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +63: [2023-04-29 11:26:50,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 11:26:50,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +63: [2023-04-29 11:26:50,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +54: [2023-04-29 11:26:50,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +29: [2023-04-29 11:26:50,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +63: [2023-04-29 11:26:50,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +63: [2023-04-29 11:26:50,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +63: [2023-04-29 11:26:50,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +63: [2023-04-29 11:26:50,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +29: [2023-04-29 11:26:50,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +53: [2023-04-29 11:26:50,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +63: [2023-04-29 11:26:50,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +63: [2023-04-29 11:26:50,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +63: [2023-04-29 11:26:50,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +15: [2023-04-29 11:26:50,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +63: [2023-04-29 11:26:50,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +49: [2023-04-29 11:26:50,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +14: [2023-04-29 11:26:50,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +15: [2023-04-29 11:26:50,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... + 6: [2023-04-29 11:26:50,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +34: [2023-04-29 11:26:50,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +34: [2023-04-29 11:26:50,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +35: [2023-04-29 11:26:50,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +34: [2023-04-29 11:26:50,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +54: [2023-04-29 11:26:50,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 9: [2023-04-29 11:26:50,963] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +49: [2023-04-29 11:26:50,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +53: [2023-04-29 11:26:50,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +31: [2023-04-29 11:26:50,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 9: [2023-04-29 11:26:50,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +34: [2023-04-29 11:26:50,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +15: [2023-04-29 11:26:50,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +35: [2023-04-29 11:26:50,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... + 6: [2023-04-29 11:26:50,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +53: [2023-04-29 11:26:50,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_00-model_states.pt. +48: [2023-04-29 11:26:50,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 6: [2023-04-29 11:26:50,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +54: [2023-04-29 11:26:50,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +59: [2023-04-29 11:26:50,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +59: [2023-04-29 11:26:50,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +59: [2023-04-29 11:26:50,967] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +31: [2023-04-29 11:26:50,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +35: [2023-04-29 11:26:50,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... + 6: [2023-04-29 11:26:50,969] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... + 3: [2023-04-29 11:26:50,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +53: [2023-04-29 11:26:50,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... + 0: [2023-04-29 11:26:50,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +54: [2023-04-29 11:26:50,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +31: [2023-04-29 11:26:50,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +53: [2023-04-29 11:26:50,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt... +35: [2023-04-29 11:26:50,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 6: [2023-04-29 11:26:50,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +31: [2023-04-29 11:26:50,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,974] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +43: [2023-04-29 11:26:50,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 6: [2023-04-29 11:26:50,974] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +35: [2023-04-29 11:26:50,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +43: [2023-04-29 11:26:50,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +59: [2023-04-29 11:26:50,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... + 3: [2023-04-29 11:26:50,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,977] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +48: [2023-04-29 11:26:50,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +13: [2023-04-29 11:26:50,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +13: [2023-04-29 11:26:50,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +16: [2023-04-29 11:26:50,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +16: [2023-04-29 11:26:50,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +16: [2023-04-29 11:26:50,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +16: [2023-04-29 11:26:50,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 4: [2023-04-29 11:26:50,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +43: [2023-04-29 11:26:50,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +43: [2023-04-29 11:26:50,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +43: [2023-04-29 11:26:50,980] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +43: [2023-04-29 11:26:50,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +43: [2023-04-29 11:26:50,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +43: [2023-04-29 11:26:50,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +20: [2023-04-29 11:26:50,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +20: [2023-04-29 11:26:50,981] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +13: [2023-04-29 11:26:50,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +13: [2023-04-29 11:26:50,981] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 8: [2023-04-29 11:26:50,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 8: [2023-04-29 11:26:50,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +19: [2023-04-29 11:26:50,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +19: [2023-04-29 11:26:50,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +19: [2023-04-29 11:26:50,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +39: [2023-04-29 11:26:50,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +16: [2023-04-29 11:26:50,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 3: [2023-04-29 11:26:50,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +16: [2023-04-29 11:26:50,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +49: [2023-04-29 11:26:50,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +27: [2023-04-29 11:26:50,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +27: [2023-04-29 11:26:50,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +27: [2023-04-29 11:26:50,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +27: [2023-04-29 11:26:50,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +43: [2023-04-29 11:26:50,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +43: [2023-04-29 11:26:50,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +20: [2023-04-29 11:26:50,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +29: [2023-04-29 11:26:50,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 4: [2023-04-29 11:26:50,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +43: [2023-04-29 11:26:50,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +43: [2023-04-29 11:26:50,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +43: [2023-04-29 11:26:50,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +43: [2023-04-29 11:26:50,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +19: [2023-04-29 11:26:50,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +43: [2023-04-29 11:26:50,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +43: [2023-04-29 11:26:50,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +16: [2023-04-29 11:26:50,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +16: [2023-04-29 11:26:50,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +18: [2023-04-29 11:26:50,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 3: [2023-04-29 11:26:50,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +20: [2023-04-29 11:26:50,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 5: [2023-04-29 11:26:50,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 5: [2023-04-29 11:26:50,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 5: [2023-04-29 11:26:50,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 4: [2023-04-29 11:26:50,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +49: [2023-04-29 11:26:50,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 5: [2023-04-29 11:26:50,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +29: [2023-04-29 11:26:50,988] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +39: [2023-04-29 11:26:50,989] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +29: [2023-04-29 11:26:50,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 8: [2023-04-29 11:26:50,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... + 8: [2023-04-29 11:26:50,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... + 8: [2023-04-29 11:26:50,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +12: [2023-04-29 11:26:50,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 11:26:50,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +29: [2023-04-29 11:26:50,991] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +39: [2023-04-29 11:26:50,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +39: [2023-04-29 11:26:50,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 11:26:50,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +25: [2023-04-29 11:26:50,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +62: [2023-04-29 11:26:50,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +62: [2023-04-29 11:26:50,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +62: [2023-04-29 11:26:50,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +62: [2023-04-29 11:26:50,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +12: [2023-04-29 11:26:50,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +59: [2023-04-29 11:26:50,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +37: [2023-04-29 11:26:50,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +37: [2023-04-29 11:26:50,997] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +10: [2023-04-29 11:26:50,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +37: [2023-04-29 11:26:50,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +37: [2023-04-29 11:26:50,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 0: [2023-04-29 11:26:50,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +27: [2023-04-29 11:26:50,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +27: [2023-04-29 11:26:50,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +27: [2023-04-29 11:26:50,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +59: [2023-04-29 11:26:50,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 0: [2023-04-29 11:26:51,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +25: [2023-04-29 11:26:51,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +62: [2023-04-29 11:26:50,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +62: [2023-04-29 11:26:51,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +25: [2023-04-29 11:26:51,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +23: [2023-04-29 11:26:51,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +23: [2023-04-29 11:26:51,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +46: [2023-04-29 11:26:51,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +46: [2023-04-29 11:26:51,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +62: [2023-04-29 11:26:51,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +62: [2023-04-29 11:26:51,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +10: [2023-04-29 11:26:51,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 11:26:51,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +63: [2023-04-29 11:26:51,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +18: [2023-04-29 11:26:51,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +18: [2023-04-29 11:26:51,001] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +25: [2023-04-29 11:26:51,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +46: [2023-04-29 11:26:51,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +59: [2023-04-29 11:26:51,002] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 0: [2023-04-29 11:26:51,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +63: [2023-04-29 11:26:51,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_125_mp_rank_02_optim_states.pt... +63: [2023-04-29 11:26:51,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_124_mp_rank_02_optim_states.pt... +63: [2023-04-29 11:26:51,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_127_mp_rank_02_optim_states.pt... +63: [2023-04-29 11:26:51,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_126_mp_rank_02_optim_states.pt... +37: [2023-04-29 11:26:51,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +40: [2023-04-29 11:26:51,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +46: [2023-04-29 11:26:51,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +37: [2023-04-29 11:26:51,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +33: [2023-04-29 11:26:51,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +37: [2023-04-29 11:26:51,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +60: [2023-04-29 11:26:51,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +60: [2023-04-29 11:26:51,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +60: [2023-04-29 11:26:51,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +37: [2023-04-29 11:26:51,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +23: [2023-04-29 11:26:51,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +23: [2023-04-29 11:26:51,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +60: [2023-04-29 11:26:51,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +10: [2023-04-29 11:26:51,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +25: [2023-04-29 11:26:51,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +18: [2023-04-29 11:26:51,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +25: [2023-04-29 11:26:51,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +12: [2023-04-29 11:26:51,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +63: [2023-04-29 11:26:51,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +25: [2023-04-29 11:26:51,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... + 3: [2023-04-29 11:26:51,006] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 3: [2023-04-29 11:26:51,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +23: [2023-04-29 11:26:51,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +23: [2023-04-29 11:26:51,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +46: [2023-04-29 11:26:51,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +40: [2023-04-29 11:26:51,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +46: [2023-04-29 11:26:51,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +24: [2023-04-29 11:26:51,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +24: [2023-04-29 11:26:51,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +24: [2023-04-29 11:26:51,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +24: [2023-04-29 11:26:51,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +18: [2023-04-29 11:26:51,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +46: [2023-04-29 11:26:51,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +45: [2023-04-29 11:26:51,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +13: [2023-04-29 11:26:51,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +14: [2023-04-29 11:26:51,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +46: [2023-04-29 11:26:51,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +13: [2023-04-29 11:26:51,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 7: [2023-04-29 11:26:51,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt... + 7: [2023-04-29 11:26:51,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt... + 7: [2023-04-29 11:26:51,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt... + 7: [2023-04-29 11:26:51,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt... +39: [2023-04-29 11:26:51,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +23: [2023-04-29 11:26:51,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +23: [2023-04-29 11:26:51,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +27: [2023-04-29 11:26:51,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +23: [2023-04-29 11:26:51,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +32: [2023-04-29 11:26:51,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +32: [2023-04-29 11:26:51,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +32: [2023-04-29 11:26:51,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +32: [2023-04-29 11:26:51,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +12: [2023-04-29 11:26:51,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +18: [2023-04-29 11:26:51,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +45: [2023-04-29 11:26:51,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +25: [2023-04-29 11:26:51,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +23: [2023-04-29 11:26:51,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +12: [2023-04-29 11:26:51,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +14: [2023-04-29 11:26:51,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +55: [2023-04-29 11:26:51,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +13: [2023-04-29 11:26:51,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +12: [2023-04-29 11:26:51,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +59: [2023-04-29 11:26:51,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +23: [2023-04-29 11:26:51,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +23: [2023-04-29 11:26:51,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 4: [2023-04-29 11:26:51,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 11:26:51,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 11:26:51,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +13: [2023-04-29 11:26:51,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +18: [2023-04-29 11:26:51,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +45: [2023-04-29 11:26:51,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +45: [2023-04-29 11:26:51,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +33: [2023-04-29 11:26:51,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +27: [2023-04-29 11:26:51,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +27: [2023-04-29 11:26:51,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +40: [2023-04-29 11:26:51,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +40: [2023-04-29 11:26:51,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +63: [2023-04-29 11:26:51,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 0: [2023-04-29 11:26:51,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +39: [2023-04-29 11:26:51,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +23: [2023-04-29 11:26:51,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +39: [2023-04-29 11:26:51,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +23: [2023-04-29 11:26:51,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +12: [2023-04-29 11:26:51,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +27: [2023-04-29 11:26:51,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +39: [2023-04-29 11:26:51,016] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +27: [2023-04-29 11:26:51,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +12: [2023-04-29 11:26:51,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +23: [2023-04-29 11:26:51,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +32: [2023-04-29 11:26:51,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +32: [2023-04-29 11:26:51,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +32: [2023-04-29 11:26:51,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. + 5: [2023-04-29 11:26:51,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +32: [2023-04-29 11:26:51,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +23: [2023-04-29 11:26:51,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 5: [2023-04-29 11:26:51,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +39: [2023-04-29 11:26:51,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +63: [2023-04-29 11:26:51,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +39: [2023-04-29 11:26:51,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +39: [2023-04-29 11:26:51,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +14: [2023-04-29 11:26:51,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +14: [2023-04-29 11:26:51,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 0: [2023-04-29 11:26:51,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 0: [2023-04-29 11:26:51,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +17: [2023-04-29 11:26:51,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 11:26:51,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... + 4: [2023-04-29 11:26:51,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +39: [2023-04-29 11:26:51,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 4: [2023-04-29 11:26:51,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +10: [2023-04-29 11:26:51,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +10: [2023-04-29 11:26:51,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +10: [2023-04-29 11:26:51,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +55: [2023-04-29 11:26:51,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +33: [2023-04-29 11:26:51,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 4: [2023-04-29 11:26:51,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +55: [2023-04-29 11:26:51,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +55: [2023-04-29 11:26:51,020] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +39: [2023-04-29 11:26:51,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +39: [2023-04-29 11:26:51,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +39: [2023-04-29 11:26:51,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +39: [2023-04-29 11:26:51,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +39: [2023-04-29 11:26:51,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +39: [2023-04-29 11:26:51,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +39: [2023-04-29 11:26:51,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +39: [2023-04-29 11:26:51,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +63: [2023-04-29 11:26:51,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +34: [2023-04-29 11:26:51,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +33: [2023-04-29 11:26:51,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +17: [2023-04-29 11:26:51,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +63: [2023-04-29 11:26:51,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +14: [2023-04-29 11:26:51,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +63: [2023-04-29 11:26:51,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... + 0: [2023-04-29 11:26:51,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +14: [2023-04-29 11:26:51,025] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +28: [2023-04-29 11:26:51,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +28: [2023-04-29 11:26:51,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +17: [2023-04-29 11:26:51,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +14: [2023-04-29 11:26:51,026] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +27: [2023-04-29 11:26:51,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +51: [2023-04-29 11:26:51,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +51: [2023-04-29 11:26:51,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 4: [2023-04-29 11:26:51,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +28: [2023-04-29 11:26:51,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +27: [2023-04-29 11:26:51,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +28: [2023-04-29 11:26:51,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +17: [2023-04-29 11:26:51,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +27: [2023-04-29 11:26:51,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +33: [2023-04-29 11:26:51,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +43: [2023-04-29 11:26:51,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_47_mp_rank_02_optim_states.pt... +43: [2023-04-29 11:26:51,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_45_mp_rank_02_optim_states.pt... +43: [2023-04-29 11:26:51,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_46_mp_rank_02_optim_states.pt... +43: [2023-04-29 11:26:51,029] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_44_mp_rank_02_optim_states.pt... + 9: [2023-04-29 11:26:51,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +57: [2023-04-29 11:26:51,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +57: [2023-04-29 11:26:51,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +57: [2023-04-29 11:26:51,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +57: [2023-04-29 11:26:51,030] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +40: [2023-04-29 11:26:51,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +51: [2023-04-29 11:26:51,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +60: [2023-04-29 11:26:51,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +51: [2023-04-29 11:26:51,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +24: [2023-04-29 11:26:51,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +31: [2023-04-29 11:26:51,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +63: [2023-04-29 11:26:51,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +17: [2023-04-29 11:26:51,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +60: [2023-04-29 11:26:51,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 9: [2023-04-29 11:26:51,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +45: [2023-04-29 11:26:51,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +51: [2023-04-29 11:26:51,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +17: [2023-04-29 11:26:51,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +14: [2023-04-29 11:26:51,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +34: [2023-04-29 11:26:51,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +24: [2023-04-29 11:26:51,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 6: [2023-04-29 11:26:51,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,034] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +60: [2023-04-29 11:26:51,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +60: [2023-04-29 11:26:51,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 6: [2023-04-29 11:26:51,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +45: [2023-04-29 11:26:51,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +17: [2023-04-29 11:26:51,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +57: [2023-04-29 11:26:51,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +55: [2023-04-29 11:26:51,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +57: [2023-04-29 11:26:51,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +31: [2023-04-29 11:26:51,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +40: [2023-04-29 11:26:51,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +57: [2023-04-29 11:26:51,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +27: [2023-04-29 11:26:51,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +24: [2023-04-29 11:26:51,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +24: [2023-04-29 11:26:51,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +41: [2023-04-29 11:26:51,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +41: [2023-04-29 11:26:51,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +17: [2023-04-29 11:26:51,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +57: [2023-04-29 11:26:51,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +41: [2023-04-29 11:26:51,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +41: [2023-04-29 11:26:51,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 6: [2023-04-29 11:26:51,040] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 6: [2023-04-29 11:26:51,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +31: [2023-04-29 11:26:51,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +31: [2023-04-29 11:26:51,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +51: [2023-04-29 11:26:51,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +34: [2023-04-29 11:26:51,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +33: [2023-04-29 11:26:51,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 9: [2023-04-29 11:26:51,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +16: [2023-04-29 11:26:51,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +16: [2023-04-29 11:26:51,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +34: [2023-04-29 11:26:51,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +33: [2023-04-29 11:26:51,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 9: [2023-04-29 11:26:51,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +33: [2023-04-29 11:26:51,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 9: [2023-04-29 11:26:51,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +33: [2023-04-29 11:26:51,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +33: [2023-04-29 11:26:51,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +33: [2023-04-29 11:26:51,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +33: [2023-04-29 11:26:51,039] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +51: [2023-04-29 11:26:51,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +51: [2023-04-29 11:26:51,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +29: [2023-04-29 11:26:51,042] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,042] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +31: [2023-04-29 11:26:51,043] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +41: [2023-04-29 11:26:51,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +45: [2023-04-29 11:26:51,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +41: [2023-04-29 11:26:51,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +45: [2023-04-29 11:26:51,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +41: [2023-04-29 11:26:51,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +55: [2023-04-29 11:26:51,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +41: [2023-04-29 11:26:51,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +29: [2023-04-29 11:26:51,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +29: [2023-04-29 11:26:51,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... + 3: [2023-04-29 11:26:51,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 11:26:51,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 4: [2023-04-29 11:26:51,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +40: [2023-04-29 11:26:51,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +31: [2023-04-29 11:26:51,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +31: [2023-04-29 11:26:51,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +40: [2023-04-29 11:26:51,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +32: [2023-04-29 11:26:51,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +19: [2023-04-29 11:26:51,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +31: [2023-04-29 11:26:51,049] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +21: [2023-04-29 11:26:51,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +21: [2023-04-29 11:26:51,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +32: [2023-04-29 11:26:51,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 0: [2023-04-29 11:26:51,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 0: [2023-04-29 11:26:51,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 11:26:51,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +21: [2023-04-29 11:26:51,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 3: [2023-04-29 11:26:51,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +25: [2023-04-29 11:26:51,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +25: [2023-04-29 11:26:51,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +25: [2023-04-29 11:26:51,050] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +29: [2023-04-29 11:26:51,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +55: [2023-04-29 11:26:51,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +25: [2023-04-29 11:26:51,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +32: [2023-04-29 11:26:51,052] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +32: [2023-04-29 11:26:51,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +32: [2023-04-29 11:26:51,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 3: [2023-04-29 11:26:51,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +55: [2023-04-29 11:26:51,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +28: [2023-04-29 11:26:51,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +28: [2023-04-29 11:26:51,054] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +19: [2023-04-29 11:26:51,055] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +25: [2023-04-29 11:26:51,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +25: [2023-04-29 11:26:51,055] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +19: [2023-04-29 11:26:51,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... + 3: [2023-04-29 11:26:51,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +25: [2023-04-29 11:26:51,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +25: [2023-04-29 11:26:51,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 4: [2023-04-29 11:26:51,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +28: [2023-04-29 11:26:51,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +37: [2023-04-29 11:26:51,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +46: [2023-04-29 11:26:51,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +19: [2023-04-29 11:26:51,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 2: [2023-04-29 11:26:51,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 2: [2023-04-29 11:26:51,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 2: [2023-04-29 11:26:51,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 2: [2023-04-29 11:26:51,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 9: [2023-04-29 11:26:51,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +20: [2023-04-29 11:26:51,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +34: [2023-04-29 11:26:51,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +33: [2023-04-29 11:26:51,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 1: [2023-04-29 11:26:51,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +16: [2023-04-29 11:26:51,045] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +22: [2023-04-29 11:26:51,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +22: [2023-04-29 11:26:51,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 9: [2023-04-29 11:26:51,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +22: [2023-04-29 11:26:51,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +33: [2023-04-29 11:26:51,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 1: [2023-04-29 11:26:51,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 1: [2023-04-29 11:26:51,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 9: [2023-04-29 11:26:51,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +16: [2023-04-29 11:26:51,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +22: [2023-04-29 11:26:51,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +20: [2023-04-29 11:26:51,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +33: [2023-04-29 11:26:51,048] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 1: [2023-04-29 11:26:51,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +16: [2023-04-29 11:26:51,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +20: [2023-04-29 11:26:51,051] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +33: [2023-04-29 11:26:51,049] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 1: [2023-04-29 11:26:51,057] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +20: [2023-04-29 11:26:51,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +33: [2023-04-29 11:26:51,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 1: [2023-04-29 11:26:51,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +20: [2023-04-29 11:26:51,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +33: [2023-04-29 11:26:51,056] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 1: [2023-04-29 11:26:51,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +33: [2023-04-29 11:26:51,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 1: [2023-04-29 11:26:51,058] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 4: [2023-04-29 11:26:51,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +33: [2023-04-29 11:26:51,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +28: [2023-04-29 11:26:51,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +47: [2023-04-29 11:26:51,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +47: [2023-04-29 11:26:51,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +29: [2023-04-29 11:26:51,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +32: [2023-04-29 11:26:51,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 3: [2023-04-29 11:26:51,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +19: [2023-04-29 11:26:51,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +32: [2023-04-29 11:26:51,061] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +19: [2023-04-29 11:26:51,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +62: [2023-04-29 11:26:51,062] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +29: [2023-04-29 11:26:51,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +32: [2023-04-29 11:26:51,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +20: [2023-04-29 11:26:51,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +20: [2023-04-29 11:26:51,064] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +47: [2023-04-29 11:26:51,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +47: [2023-04-29 11:26:51,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 3: [2023-04-29 11:26:51,065] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +19: [2023-04-29 11:26:51,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +29: [2023-04-29 11:26:51,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +38: [2023-04-29 11:26:51,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +38: [2023-04-29 11:26:51,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +38: [2023-04-29 11:26:51,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +38: [2023-04-29 11:26:51,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +47: [2023-04-29 11:26:51,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +62: [2023-04-29 11:26:51,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 3: [2023-04-29 11:26:51,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +62: [2023-04-29 11:26:51,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +62: [2023-04-29 11:26:51,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +19: [2023-04-29 11:26:51,068] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +47: [2023-04-29 11:26:51,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +52: [2023-04-29 11:26:51,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +52: [2023-04-29 11:26:51,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +47: [2023-04-29 11:26:51,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +29: [2023-04-29 11:26:51,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +34: [2023-04-29 11:26:51,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +16: [2023-04-29 11:26:51,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +16: [2023-04-29 11:26:51,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +37: [2023-04-29 11:26:51,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +20: [2023-04-29 11:26:51,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +34: [2023-04-29 11:26:51,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +34: [2023-04-29 11:26:51,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +16: [2023-04-29 11:26:51,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +38: [2023-04-29 11:26:51,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 3: [2023-04-29 11:26:51,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +16: [2023-04-29 11:26:51,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +38: [2023-04-29 11:26:51,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +52: [2023-04-29 11:26:51,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +38: [2023-04-29 11:26:51,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +52: [2023-04-29 11:26:51,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +47: [2023-04-29 11:26:51,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +38: [2023-04-29 11:26:51,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +16: [2023-04-29 11:26:51,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +21: [2023-04-29 11:26:51,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 5: [2023-04-29 11:26:51,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +16: [2023-04-29 11:26:51,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +27: [2023-04-29 11:26:51,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +52: [2023-04-29 11:26:51,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +37: [2023-04-29 11:26:51,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +52: [2023-04-29 11:26:51,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +52: [2023-04-29 11:26:51,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +46: [2023-04-29 11:26:51,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +46: [2023-04-29 11:26:51,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +46: [2023-04-29 11:26:51,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +52: [2023-04-29 11:26:51,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +39: [2023-04-29 11:26:51,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_30_mp_rank_02_optim_states.pt... +39: [2023-04-29 11:26:51,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_28_mp_rank_02_optim_states.pt... +39: [2023-04-29 11:26:51,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_29_mp_rank_02_optim_states.pt... +39: [2023-04-29 11:26:51,078] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_31_mp_rank_02_optim_states.pt... +27: [2023-04-29 11:26:51,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +37: [2023-04-29 11:26:51,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +16: [2023-04-29 11:26:51,079] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +60: [2023-04-29 11:26:51,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +60: [2023-04-29 11:26:51,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +60: [2023-04-29 11:26:51,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +60: [2023-04-29 11:26:51,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +27: [2023-04-29 11:26:51,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +53: [2023-04-29 11:26:51,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +53: [2023-04-29 11:26:51,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +13: [2023-04-29 11:26:51,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +13: [2023-04-29 11:26:51,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +13: [2023-04-29 11:26:51,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +50: [2023-04-29 11:26:51,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +50: [2023-04-29 11:26:51,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +50: [2023-04-29 11:26:51,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +53: [2023-04-29 11:26:51,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +50: [2023-04-29 11:26:51,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +53: [2023-04-29 11:26:51,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +23: [2023-04-29 11:26:51,081] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +22: [2023-04-29 11:26:51,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +22: [2023-04-29 11:26:51,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +27: [2023-04-29 11:26:51,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +46: [2023-04-29 11:26:51,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +21: [2023-04-29 11:26:51,083] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +21: [2023-04-29 11:26:51,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +21: [2023-04-29 11:26:51,084] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +56: [2023-04-29 11:26:51,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +56: [2023-04-29 11:26:51,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +23: [2023-04-29 11:26:51,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +56: [2023-04-29 11:26:51,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +56: [2023-04-29 11:26:51,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +39: [2023-04-29 11:26:51,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +39: [2023-04-29 11:26:51,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +39: [2023-04-29 11:26:51,085] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +39: [2023-04-29 11:26:51,086] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +60: [2023-04-29 11:26:51,086] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +53: [2023-04-29 11:26:51,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +53: [2023-04-29 11:26:51,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +53: [2023-04-29 11:26:51,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +53: [2023-04-29 11:26:51,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +50: [2023-04-29 11:26:51,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +23: [2023-04-29 11:26:51,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +60: [2023-04-29 11:26:51,088] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +60: [2023-04-29 11:26:51,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +50: [2023-04-29 11:26:51,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +37: [2023-04-29 11:26:51,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +13: [2023-04-29 11:26:51,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +13: [2023-04-29 11:26:51,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +58: [2023-04-29 11:26:51,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +58: [2023-04-29 11:26:51,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +13: [2023-04-29 11:26:51,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +62: [2023-04-29 11:26:51,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 11:26:51,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +56: [2023-04-29 11:26:51,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +56: [2023-04-29 11:26:51,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +58: [2023-04-29 11:26:51,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +56: [2023-04-29 11:26:51,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 5: [2023-04-29 11:26:51,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 2: [2023-04-29 11:26:51,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +13: [2023-04-29 11:26:51,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +50: [2023-04-29 11:26:51,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +56: [2023-04-29 11:26:51,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +60: [2023-04-29 11:26:51,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 2: [2023-04-29 11:26:51,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 5: [2023-04-29 11:26:51,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... + 5: [2023-04-29 11:26:51,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +50: [2023-04-29 11:26:51,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 2: [2023-04-29 11:26:51,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +43: [2023-04-29 11:26:51,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +43: [2023-04-29 11:26:51,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +43: [2023-04-29 11:26:51,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +43: [2023-04-29 11:26:51,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. + 2: [2023-04-29 11:26:51,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +23: [2023-04-29 11:26:51,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +57: [2023-04-29 11:26:51,092] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +22: [2023-04-29 11:26:51,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +27: [2023-04-29 11:26:51,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +27: [2023-04-29 11:26:51,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +51: [2023-04-29 11:26:51,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +22: [2023-04-29 11:26:51,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... + 5: [2023-04-29 11:26:51,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +24: [2023-04-29 11:26:51,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +13: [2023-04-29 11:26:51,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +60: [2023-04-29 11:26:51,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +62: [2023-04-29 11:26:51,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +62: [2023-04-29 11:26:51,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 5: [2023-04-29 11:26:51,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +62: [2023-04-29 11:26:51,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +62: [2023-04-29 11:26:51,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +62: [2023-04-29 11:26:51,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +62: [2023-04-29 11:26:51,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +62: [2023-04-29 11:26:51,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +27: [2023-04-29 11:26:51,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +62: [2023-04-29 11:26:51,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +62: [2023-04-29 11:26:51,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +24: [2023-04-29 11:26:51,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +62: [2023-04-29 11:26:51,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +51: [2023-04-29 11:26:51,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +62: [2023-04-29 11:26:51,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +27: [2023-04-29 11:26:51,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +42: [2023-04-29 11:26:51,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +42: [2023-04-29 11:26:51,102] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +62: [2023-04-29 11:26:51,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 9: [2023-04-29 11:26:51,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 9: [2023-04-29 11:26:51,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 9: [2023-04-29 11:26:51,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +60: [2023-04-29 11:26:51,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +62: [2023-04-29 11:26:51,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +62: [2023-04-29 11:26:51,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 9: [2023-04-29 11:26:51,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +60: [2023-04-29 11:26:51,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +60: [2023-04-29 11:26:51,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +62: [2023-04-29 11:26:51,103] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +33: [2023-04-29 11:26:51,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_6_mp_rank_02_optim_states.pt... +33: [2023-04-29 11:26:51,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_4_mp_rank_02_optim_states.pt... +33: [2023-04-29 11:26:51,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_7_mp_rank_02_optim_states.pt... +33: [2023-04-29 11:26:51,104] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_5_mp_rank_02_optim_states.pt... +57: [2023-04-29 11:26:51,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +42: [2023-04-29 11:26:51,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +37: [2023-04-29 11:26:51,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +37: [2023-04-29 11:26:51,105] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +42: [2023-04-29 11:26:51,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +36: [2023-04-29 11:26:51,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +36: [2023-04-29 11:26:51,105] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +36: [2023-04-29 11:26:51,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +24: [2023-04-29 11:26:51,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +46: [2023-04-29 11:26:51,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +36: [2023-04-29 11:26:51,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +46: [2023-04-29 11:26:51,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +42: [2023-04-29 11:26:51,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +24: [2023-04-29 11:26:51,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +24: [2023-04-29 11:26:51,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 9: [2023-04-29 11:26:51,107] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +57: [2023-04-29 11:26:51,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +42: [2023-04-29 11:26:51,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +57: [2023-04-29 11:26:51,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 9: [2023-04-29 11:26:51,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +58: [2023-04-29 11:26:51,108] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 9: [2023-04-29 11:26:51,108] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +60: [2023-04-29 11:26:51,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +60: [2023-04-29 11:26:51,109] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +46: [2023-04-29 11:26:51,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 9: [2023-04-29 11:26:51,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +28: [2023-04-29 11:26:51,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +28: [2023-04-29 11:26:51,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +51: [2023-04-29 11:26:51,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +58: [2023-04-29 11:26:51,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +58: [2023-04-29 11:26:51,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +28: [2023-04-29 11:26:51,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +42: [2023-04-29 11:26:51,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +42: [2023-04-29 11:26:51,111] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +28: [2023-04-29 11:26:51,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +60: [2023-04-29 11:26:51,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +25: [2023-04-29 11:26:51,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +58: [2023-04-29 11:26:51,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +37: [2023-04-29 11:26:51,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +41: [2023-04-29 11:26:51,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +41: [2023-04-29 11:26:51,112] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +39: [2023-04-29 11:26:51,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +39: [2023-04-29 11:26:51,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +41: [2023-04-29 11:26:51,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +24: [2023-04-29 11:26:51,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +24: [2023-04-29 11:26:51,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +24: [2023-04-29 11:26:51,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +28: [2023-04-29 11:26:51,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +28: [2023-04-29 11:26:51,116] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +58: [2023-04-29 11:26:51,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +49: [2023-04-29 11:26:51,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +49: [2023-04-29 11:26:51,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +39: [2023-04-29 11:26:51,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +58: [2023-04-29 11:26:51,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +41: [2023-04-29 11:26:51,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +39: [2023-04-29 11:26:51,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 4: [2023-04-29 11:26:51,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt... + 4: [2023-04-29 11:26:51,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt... +58: [2023-04-29 11:26:51,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +58: [2023-04-29 11:26:51,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +58: [2023-04-29 11:26:51,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 1: [2023-04-29 11:26:51,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +28: [2023-04-29 11:26:51,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +57: [2023-04-29 11:26:51,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +51: [2023-04-29 11:26:51,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 4: [2023-04-29 11:26:51,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt... + 4: [2023-04-29 11:26:51,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt... +58: [2023-04-29 11:26:51,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +28: [2023-04-29 11:26:51,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +28: [2023-04-29 11:26:51,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +58: [2023-04-29 11:26:51,120] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +32: [2023-04-29 11:26:51,119] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +60: [2023-04-29 11:26:51,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +44: [2023-04-29 11:26:51,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +49: [2023-04-29 11:26:51,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +44: [2023-04-29 11:26:51,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +33: [2023-04-29 11:26:51,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +33: [2023-04-29 11:26:51,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +44: [2023-04-29 11:26:51,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +49: [2023-04-29 11:26:51,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +44: [2023-04-29 11:26:51,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +58: [2023-04-29 11:26:51,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +33: [2023-04-29 11:26:51,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +25: [2023-04-29 11:26:51,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +43: [2023-04-29 11:26:51,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +43: [2023-04-29 11:26:51,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +43: [2023-04-29 11:26:51,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +43: [2023-04-29 11:26:51,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +25: [2023-04-29 11:26:51,125] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +32: [2023-04-29 11:26:51,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +33: [2023-04-29 11:26:51,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +44: [2023-04-29 11:26:51,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +28: [2023-04-29 11:26:51,125] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +44: [2023-04-29 11:26:51,126] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 1: [2023-04-29 11:26:51,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 1: [2023-04-29 11:26:51,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 1: [2023-04-29 11:26:51,126] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +51: [2023-04-29 11:26:51,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +28: [2023-04-29 11:26:51,127] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +44: [2023-04-29 11:26:51,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +61: [2023-04-29 11:26:51,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +61: [2023-04-29 11:26:51,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +61: [2023-04-29 11:26:51,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +61: [2023-04-29 11:26:51,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +25: [2023-04-29 11:26:51,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +44: [2023-04-29 11:26:51,129] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +21: [2023-04-29 11:26:51,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +52: [2023-04-29 11:26:51,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +32: [2023-04-29 11:26:51,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +28: [2023-04-29 11:26:51,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +36: [2023-04-29 11:26:51,133] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +21: [2023-04-29 11:26:51,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +28: [2023-04-29 11:26:51,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +47: [2023-04-29 11:26:51,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +36: [2023-04-29 11:26:51,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +61: [2023-04-29 11:26:51,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +61: [2023-04-29 11:26:51,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +51: [2023-04-29 11:26:51,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +51: [2023-04-29 11:26:51,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +51: [2023-04-29 11:26:51,134] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +51: [2023-04-29 11:26:51,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +61: [2023-04-29 11:26:51,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +51: [2023-04-29 11:26:51,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +51: [2023-04-29 11:26:51,135] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +51: [2023-04-29 11:26:51,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +61: [2023-04-29 11:26:51,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +16: [2023-04-29 11:26:51,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt... +57: [2023-04-29 11:26:51,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +16: [2023-04-29 11:26:51,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt... +16: [2023-04-29 11:26:51,136] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt... +36: [2023-04-29 11:26:51,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +36: [2023-04-29 11:26:51,137] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +16: [2023-04-29 11:26:51,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt... +57: [2023-04-29 11:26:51,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +57: [2023-04-29 11:26:51,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +32: [2023-04-29 11:26:51,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +47: [2023-04-29 11:26:51,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +47: [2023-04-29 11:26:51,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +32: [2023-04-29 11:26:51,140] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +41: [2023-04-29 11:26:51,140] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +38: [2023-04-29 11:26:51,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +51: [2023-04-29 11:26:51,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +51: [2023-04-29 11:26:51,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +51: [2023-04-29 11:26:51,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +25: [2023-04-29 11:26:51,142] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +51: [2023-04-29 11:26:51,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +52: [2023-04-29 11:26:51,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +38: [2023-04-29 11:26:51,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +28: [2023-04-29 11:26:51,143] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +54: [2023-04-29 11:26:51,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +54: [2023-04-29 11:26:51,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +54: [2023-04-29 11:26:51,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +54: [2023-04-29 11:26:51,143] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +28: [2023-04-29 11:26:51,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +49: [2023-04-29 11:26:51,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +41: [2023-04-29 11:26:51,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +38: [2023-04-29 11:26:51,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +38: [2023-04-29 11:26:51,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 11:26:51,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 1: [2023-04-29 11:26:51,146] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +52: [2023-04-29 11:26:51,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +32: [2023-04-29 11:26:51,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +49: [2023-04-29 11:26:51,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +49: [2023-04-29 11:26:51,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +51: [2023-04-29 11:26:51,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 11:26:51,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +54: [2023-04-29 11:26:51,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +54: [2023-04-29 11:26:51,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +51: [2023-04-29 11:26:51,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +51: [2023-04-29 11:26:51,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +50: [2023-04-29 11:26:51,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +35: [2023-04-29 11:26:51,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +35: [2023-04-29 11:26:51,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +51: [2023-04-29 11:26:51,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 11:26:51,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +49: [2023-04-29 11:26:51,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +52: [2023-04-29 11:26:51,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +54: [2023-04-29 11:26:51,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +32: [2023-04-29 11:26:51,150] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +25: [2023-04-29 11:26:51,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +35: [2023-04-29 11:26:51,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +56: [2023-04-29 11:26:51,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +25: [2023-04-29 11:26:51,151] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +35: [2023-04-29 11:26:51,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +53: [2023-04-29 11:26:51,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +53: [2023-04-29 11:26:51,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +28: [2023-04-29 11:26:51,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +47: [2023-04-29 11:26:51,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +60: [2023-04-29 11:26:51,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +21: [2023-04-29 11:26:51,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +21: [2023-04-29 11:26:51,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +16: [2023-04-29 11:26:51,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +33: [2023-04-29 11:26:51,154] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +35: [2023-04-29 11:26:51,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +50: [2023-04-29 11:26:51,154] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 1: [2023-04-29 11:26:51,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +32: [2023-04-29 11:26:51,155] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +22: [2023-04-29 11:26:51,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +22: [2023-04-29 11:26:51,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +53: [2023-04-29 11:26:51,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +53: [2023-04-29 11:26:51,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 1: [2023-04-29 11:26:51,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +25: [2023-04-29 11:26:51,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 1: [2023-04-29 11:26:51,156] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +35: [2023-04-29 11:26:51,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +35: [2023-04-29 11:26:51,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +16: [2023-04-29 11:26:51,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +16: [2023-04-29 11:26:51,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +33: [2023-04-29 11:26:51,158] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +56: [2023-04-29 11:26:51,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +47: [2023-04-29 11:26:51,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +26: [2023-04-29 11:26:51,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +26: [2023-04-29 11:26:51,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +21: [2023-04-29 11:26:51,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +33: [2023-04-29 11:26:51,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +26: [2023-04-29 11:26:51,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +35: [2023-04-29 11:26:51,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +21: [2023-04-29 11:26:51,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +21: [2023-04-29 11:26:51,161] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +33: [2023-04-29 11:26:51,159] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +56: [2023-04-29 11:26:51,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +26: [2023-04-29 11:26:51,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +18: [2023-04-29 11:26:51,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 11:26:51,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 11:26:51,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 11:26:51,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +22: [2023-04-29 11:26:51,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +22: [2023-04-29 11:26:51,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +16: [2023-04-29 11:26:51,162] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +56: [2023-04-29 11:26:51,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +16: [2023-04-29 11:26:51,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +52: [2023-04-29 11:26:51,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +60: [2023-04-29 11:26:51,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +60: [2023-04-29 11:26:51,163] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +16: [2023-04-29 11:26:51,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +60: [2023-04-29 11:26:51,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +16: [2023-04-29 11:26:51,165] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... + 2: [2023-04-29 11:26:51,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +18: [2023-04-29 11:26:51,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +21: [2023-04-29 11:26:51,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +18: [2023-04-29 11:26:51,166] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +23: [2023-04-29 11:26:51,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt... +23: [2023-04-29 11:26:51,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt... +23: [2023-04-29 11:26:51,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt... +23: [2023-04-29 11:26:51,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt... +18: [2023-04-29 11:26:51,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +48: [2023-04-29 11:26:51,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +48: [2023-04-29 11:26:51,167] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +18: [2023-04-29 11:26:51,168] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +52: [2023-04-29 11:26:51,169] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +22: [2023-04-29 11:26:51,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +16: [2023-04-29 11:26:51,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +62: [2023-04-29 11:26:51,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_121_mp_rank_02_optim_states.pt... + 2: [2023-04-29 11:26:51,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 2: [2023-04-29 11:26:51,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. + 2: [2023-04-29 11:26:51,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +62: [2023-04-29 11:26:51,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_122_mp_rank_02_optim_states.pt... +62: [2023-04-29 11:26:51,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_123_mp_rank_02_optim_states.pt... +62: [2023-04-29 11:26:51,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_120_mp_rank_02_optim_states.pt... +47: [2023-04-29 11:26:51,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +47: [2023-04-29 11:26:51,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +48: [2023-04-29 11:26:51,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +38: [2023-04-29 11:26:51,171] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +48: [2023-04-29 11:26:51,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +38: [2023-04-29 11:26:51,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 2: [2023-04-29 11:26:51,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +36: [2023-04-29 11:26:51,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +36: [2023-04-29 11:26:51,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +13: [2023-04-29 11:26:51,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +13: [2023-04-29 11:26:51,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +36: [2023-04-29 11:26:51,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +13: [2023-04-29 11:26:51,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +36: [2023-04-29 11:26:51,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +48: [2023-04-29 11:26:51,173] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +13: [2023-04-29 11:26:51,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 9: [2023-04-29 11:26:51,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +48: [2023-04-29 11:26:51,174] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +22: [2023-04-29 11:26:51,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +42: [2023-04-29 11:26:51,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +42: [2023-04-29 11:26:51,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +50: [2023-04-29 11:26:51,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +50: [2023-04-29 11:26:51,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +56: [2023-04-29 11:26:51,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 9: [2023-04-29 11:26:51,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 9: [2023-04-29 11:26:51,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +50: [2023-04-29 11:26:51,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +38: [2023-04-29 11:26:51,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +38: [2023-04-29 11:26:51,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +13: [2023-04-29 11:26:51,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 2: [2023-04-29 11:26:51,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +52: [2023-04-29 11:26:51,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +13: [2023-04-29 11:26:51,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +22: [2023-04-29 11:26:51,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... + 2: [2023-04-29 11:26:51,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +48: [2023-04-29 11:26:51,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 2: [2023-04-29 11:26:51,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +36: [2023-04-29 11:26:51,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +52: [2023-04-29 11:26:51,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +36: [2023-04-29 11:26:51,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +13: [2023-04-29 11:26:51,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +13: [2023-04-29 11:26:51,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +36: [2023-04-29 11:26:51,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +11: [2023-04-29 11:26:51,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +11: [2023-04-29 11:26:51,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +48: [2023-04-29 11:26:51,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +42: [2023-04-29 11:26:51,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +36: [2023-04-29 11:26:51,180] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +11: [2023-04-29 11:26:51,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +60: [2023-04-29 11:26:51,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +53: [2023-04-29 11:26:51,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +53: [2023-04-29 11:26:51,181] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +11: [2023-04-29 11:26:51,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +38: [2023-04-29 11:26:51,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +38: [2023-04-29 11:26:51,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +38: [2023-04-29 11:26:51,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +38: [2023-04-29 11:26:51,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +38: [2023-04-29 11:26:51,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +38: [2023-04-29 11:26:51,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 9: [2023-04-29 11:26:51,182] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +28: [2023-04-29 11:26:51,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +47: [2023-04-29 11:26:51,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +22: [2023-04-29 11:26:51,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +38: [2023-04-29 11:26:51,183] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +38: [2023-04-29 11:26:51,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +53: [2023-04-29 11:26:51,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +38: [2023-04-29 11:26:51,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 7: [2023-04-29 11:26:51,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 7: [2023-04-29 11:26:51,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +53: [2023-04-29 11:26:51,184] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +38: [2023-04-29 11:26:51,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 7: [2023-04-29 11:26:51,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. + 7: [2023-04-29 11:26:51,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_19-model_01-model_states.pt. +42: [2023-04-29 11:26:51,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +43: [2023-04-29 11:26:51,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +58: [2023-04-29 11:26:51,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +44: [2023-04-29 11:26:51,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +60: [2023-04-29 11:26:51,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 11:26:51,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +60: [2023-04-29 11:26:51,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +56: [2023-04-29 11:26:51,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 11:26:51,186] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +56: [2023-04-29 11:26:51,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 11:26:51,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 11:26:51,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +39: [2023-04-29 11:26:51,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +39: [2023-04-29 11:26:51,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +56: [2023-04-29 11:26:51,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +60: [2023-04-29 11:26:51,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +28: [2023-04-29 11:26:51,187] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +26: [2023-04-29 11:26:51,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +26: [2023-04-29 11:26:51,187] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +50: [2023-04-29 11:26:51,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +43: [2023-04-29 11:26:51,190] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +58: [2023-04-29 11:26:51,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +38: [2023-04-29 11:26:51,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +38: [2023-04-29 11:26:51,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 11:26:51,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +44: [2023-04-29 11:26:51,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +56: [2023-04-29 11:26:51,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +56: [2023-04-29 11:26:51,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 11:26:51,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +56: [2023-04-29 11:26:51,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 11:26:51,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 11:26:51,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +56: [2023-04-29 11:26:51,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 11:26:51,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +39: [2023-04-29 11:26:51,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +39: [2023-04-29 11:26:51,192] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +43: [2023-04-29 11:26:51,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +43: [2023-04-29 11:26:51,192] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +26: [2023-04-29 11:26:51,193] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +62: [2023-04-29 11:26:51,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +62: [2023-04-29 11:26:51,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +62: [2023-04-29 11:26:51,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +62: [2023-04-29 11:26:51,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +58: [2023-04-29 11:26:51,194] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +58: [2023-04-29 11:26:51,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +58: [2023-04-29 11:26:51,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +28: [2023-04-29 11:26:51,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +39: [2023-04-29 11:26:51,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +28: [2023-04-29 11:26:51,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +44: [2023-04-29 11:26:51,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +39: [2023-04-29 11:26:51,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 11:26:51,196] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +26: [2023-04-29 11:26:51,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +58: [2023-04-29 11:26:51,197] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +43: [2023-04-29 11:26:51,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +43: [2023-04-29 11:26:51,198] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +60: [2023-04-29 11:26:51,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +60: [2023-04-29 11:26:51,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +60: [2023-04-29 11:26:51,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 11:26:51,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +60: [2023-04-29 11:26:51,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +60: [2023-04-29 11:26:51,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +60: [2023-04-29 11:26:51,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +60: [2023-04-29 11:26:51,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +60: [2023-04-29 11:26:51,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +60: [2023-04-29 11:26:51,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +60: [2023-04-29 11:26:51,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +60: [2023-04-29 11:26:51,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +60: [2023-04-29 11:26:51,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +43: [2023-04-29 11:26:51,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +58: [2023-04-29 11:26:51,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +30: [2023-04-29 11:26:51,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +30: [2023-04-29 11:26:51,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +36: [2023-04-29 11:26:51,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +30: [2023-04-29 11:26:51,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +39: [2023-04-29 11:26:51,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +51: [2023-04-29 11:26:51,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_76_mp_rank_02_optim_states.pt... +51: [2023-04-29 11:26:51,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_79_mp_rank_02_optim_states.pt... +51: [2023-04-29 11:26:51,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_78_mp_rank_02_optim_states.pt... +51: [2023-04-29 11:26:51,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_77_mp_rank_02_optim_states.pt... +61: [2023-04-29 11:26:51,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +61: [2023-04-29 11:26:51,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +58: [2023-04-29 11:26:51,202] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +39: [2023-04-29 11:26:51,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +59: [2023-04-29 11:26:51,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +59: [2023-04-29 11:26:51,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +30: [2023-04-29 11:26:51,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +36: [2023-04-29 11:26:51,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +59: [2023-04-29 11:26:51,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +49: [2023-04-29 11:26:51,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +59: [2023-04-29 11:26:51,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +49: [2023-04-29 11:26:51,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +58: [2023-04-29 11:26:51,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +49: [2023-04-29 11:26:51,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +43: [2023-04-29 11:26:51,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +49: [2023-04-29 11:26:51,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +30: [2023-04-29 11:26:51,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +36: [2023-04-29 11:26:51,206] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt... + 6: [2023-04-29 11:26:51,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt... + 6: [2023-04-29 11:26:51,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt... + 6: [2023-04-29 11:26:51,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt... +30: [2023-04-29 11:26:51,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +30: [2023-04-29 11:26:51,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +54: [2023-04-29 11:26:51,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +36: [2023-04-29 11:26:51,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +61: [2023-04-29 11:26:51,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +61: [2023-04-29 11:26:51,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +30: [2023-04-29 11:26:51,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +42: [2023-04-29 11:26:51,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +50: [2023-04-29 11:26:51,208] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +36: [2023-04-29 11:26:51,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +50: [2023-04-29 11:26:51,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +28: [2023-04-29 11:26:51,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +49: [2023-04-29 11:26:51,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +42: [2023-04-29 11:26:51,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +36: [2023-04-29 11:26:51,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... + 7: [2023-04-29 11:26:51,209] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +11: [2023-04-29 11:26:51,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +49: [2023-04-29 11:26:51,210] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +58: [2023-04-29 11:26:51,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +42: [2023-04-29 11:26:51,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 7: [2023-04-29 11:26:51,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +49: [2023-04-29 11:26:51,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +49: [2023-04-29 11:26:51,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +36: [2023-04-29 11:26:51,212] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +36: [2023-04-29 11:26:51,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +54: [2023-04-29 11:26:51,213] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 11:26:51,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +49: [2023-04-29 11:26:51,214] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +44: [2023-04-29 11:26:51,215] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +35: [2023-04-29 11:26:51,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +11: [2023-04-29 11:26:51,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +28: [2023-04-29 11:26:51,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 7: [2023-04-29 11:26:51,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +51: [2023-04-29 11:26:51,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +51: [2023-04-29 11:26:51,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +51: [2023-04-29 11:26:51,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +51: [2023-04-29 11:26:51,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +49: [2023-04-29 11:26:51,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +49: [2023-04-29 11:26:51,218] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +42: [2023-04-29 11:26:51,218] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +49: [2023-04-29 11:26:51,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +38: [2023-04-29 11:26:51,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +38: [2023-04-29 11:26:51,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +38: [2023-04-29 11:26:51,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +38: [2023-04-29 11:26:51,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +33: [2023-04-29 11:26:51,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 7: [2023-04-29 11:26:51,219] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt... +54: [2023-04-29 11:26:51,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +49: [2023-04-29 11:26:51,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +49: [2023-04-29 11:26:51,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +11: [2023-04-29 11:26:51,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +18: [2023-04-29 11:26:51,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +49: [2023-04-29 11:26:51,223] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +11: [2023-04-29 11:26:51,223] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +62: [2023-04-29 11:26:51,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +44: [2023-04-29 11:26:51,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +33: [2023-04-29 11:26:51,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +54: [2023-04-29 11:26:51,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +54: [2023-04-29 11:26:51,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +54: [2023-04-29 11:26:51,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +54: [2023-04-29 11:26:51,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +54: [2023-04-29 11:26:51,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +62: [2023-04-29 11:26:51,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +62: [2023-04-29 11:26:51,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +35: [2023-04-29 11:26:51,226] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +58: [2023-04-29 11:26:51,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +44: [2023-04-29 11:26:51,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +58: [2023-04-29 11:26:51,226] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +28: [2023-04-29 11:26:51,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +62: [2023-04-29 11:26:51,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +59: [2023-04-29 11:26:51,227] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +28: [2023-04-29 11:26:51,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +59: [2023-04-29 11:26:51,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +59: [2023-04-29 11:26:51,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +59: [2023-04-29 11:26:51,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +46: [2023-04-29 11:26:51,229] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +46: [2023-04-29 11:26:51,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +46: [2023-04-29 11:26:51,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +58: [2023-04-29 11:26:51,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +59: [2023-04-29 11:26:51,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +59: [2023-04-29 11:26:51,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +46: [2023-04-29 11:26:51,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +58: [2023-04-29 11:26:51,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +59: [2023-04-29 11:26:51,230] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +61: [2023-04-29 11:26:51,230] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +49: [2023-04-29 11:26:51,231] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +33: [2023-04-29 11:26:51,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +33: [2023-04-29 11:26:51,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +61: [2023-04-29 11:26:51,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +33: [2023-04-29 11:26:51,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +18: [2023-04-29 11:26:51,233] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 11:26:51,234] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 0: [2023-04-29 11:26:51,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 11:26:51,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 11:26:51,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 11:26:51,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 11:26:51,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +59: [2023-04-29 11:26:51,236] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 0: [2023-04-29 11:26:51,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 0: [2023-04-29 11:26:51,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 0: [2023-04-29 11:26:51,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +54: [2023-04-29 11:26:51,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +61: [2023-04-29 11:26:51,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +61: [2023-04-29 11:26:51,238] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +13: [2023-04-29 11:26:51,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +33: [2023-04-29 11:26:51,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +33: [2023-04-29 11:26:51,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +59: [2023-04-29 11:26:51,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +30: [2023-04-29 11:26:51,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +30: [2023-04-29 11:26:51,239] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +33: [2023-04-29 11:26:51,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... + 0: [2023-04-29 11:26:51,239] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +35: [2023-04-29 11:26:51,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +35: [2023-04-29 11:26:51,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +59: [2023-04-29 11:26:51,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +18: [2023-04-29 11:26:51,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +48: [2023-04-29 11:26:51,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +48: [2023-04-29 11:26:51,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 3: [2023-04-29 11:26:51,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 3: [2023-04-29 11:26:51,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +30: [2023-04-29 11:26:51,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +59: [2023-04-29 11:26:51,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +54: [2023-04-29 11:26:51,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +59: [2023-04-29 11:26:51,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +36: [2023-04-29 11:26:51,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +30: [2023-04-29 11:26:51,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 0: [2023-04-29 11:26:51,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 0: [2023-04-29 11:26:51,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 6: [2023-04-29 11:26:51,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 6: [2023-04-29 11:26:51,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 6: [2023-04-29 11:26:51,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 3: [2023-04-29 11:26:51,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 6: [2023-04-29 11:26:51,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +35: [2023-04-29 11:26:51,243] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 0: [2023-04-29 11:26:51,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +13: [2023-04-29 11:26:51,244] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +51: [2023-04-29 11:26:51,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +51: [2023-04-29 11:26:51,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 3: [2023-04-29 11:26:51,244] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +58: [2023-04-29 11:26:51,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +58: [2023-04-29 11:26:51,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +58: [2023-04-29 11:26:51,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +58: [2023-04-29 11:26:51,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 11:26:51,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 11:26:51,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 11:26:51,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +58: [2023-04-29 11:26:51,245] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 11:26:51,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +58: [2023-04-29 11:26:51,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +58: [2023-04-29 11:26:51,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +58: [2023-04-29 11:26:51,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +51: [2023-04-29 11:26:51,247] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 9: [2023-04-29 11:26:51,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt... + 9: [2023-04-29 11:26:51,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt... + 9: [2023-04-29 11:26:51,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt... + 9: [2023-04-29 11:26:51,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt... +38: [2023-04-29 11:26:51,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +38: [2023-04-29 11:26:51,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +38: [2023-04-29 11:26:51,248] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +38: [2023-04-29 11:26:51,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +54: [2023-04-29 11:26:51,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +51: [2023-04-29 11:26:51,250] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +27: [2023-04-29 11:26:51,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 11:26:51,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +13: [2023-04-29 11:26:51,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +27: [2023-04-29 11:26:51,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +27: [2023-04-29 11:26:51,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +18: [2023-04-29 11:26:51,251] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +48: [2023-04-29 11:26:51,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +48: [2023-04-29 11:26:51,251] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +35: [2023-04-29 11:26:51,252] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +27: [2023-04-29 11:26:51,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +36: [2023-04-29 11:26:51,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +36: [2023-04-29 11:26:51,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +60: [2023-04-29 11:26:51,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_113_mp_rank_02_optim_states.pt... +60: [2023-04-29 11:26:51,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_114_mp_rank_02_optim_states.pt... +60: [2023-04-29 11:26:51,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_112_mp_rank_02_optim_states.pt... +60: [2023-04-29 11:26:51,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_115_mp_rank_02_optim_states.pt... +36: [2023-04-29 11:26:51,253] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +54: [2023-04-29 11:26:51,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +56: [2023-04-29 11:26:51,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_98_mp_rank_02_optim_states.pt... +56: [2023-04-29 11:26:51,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_99_mp_rank_02_optim_states.pt... +56: [2023-04-29 11:26:51,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_96_mp_rank_02_optim_states.pt... +56: [2023-04-29 11:26:51,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_97_mp_rank_02_optim_states.pt... +54: [2023-04-29 11:26:51,254] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +27: [2023-04-29 11:26:51,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +46: [2023-04-29 11:26:51,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +46: [2023-04-29 11:26:51,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +27: [2023-04-29 11:26:51,256] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +54: [2023-04-29 11:26:51,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 11:26:51,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +54: [2023-04-29 11:26:51,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 11:26:51,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +27: [2023-04-29 11:26:51,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +18: [2023-04-29 11:26:51,257] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +27: [2023-04-29 11:26:51,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +26: [2023-04-29 11:26:51,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +26: [2023-04-29 11:26:51,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +40: [2023-04-29 11:26:51,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +54: [2023-04-29 11:26:51,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 11:26:51,258] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +40: [2023-04-29 11:26:51,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +54: [2023-04-29 11:26:51,258] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 11:26:51,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 11:26:51,259] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +54: [2023-04-29 11:26:51,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +38: [2023-04-29 11:26:51,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_24_mp_rank_02_optim_states.pt... +40: [2023-04-29 11:26:51,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +38: [2023-04-29 11:26:51,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_25_mp_rank_02_optim_states.pt... +38: [2023-04-29 11:26:51,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_27_mp_rank_02_optim_states.pt... +18: [2023-04-29 11:26:51,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +18: [2023-04-29 11:26:51,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +54: [2023-04-29 11:26:51,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +38: [2023-04-29 11:26:51,260] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_26_mp_rank_02_optim_states.pt... +40: [2023-04-29 11:26:51,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +46: [2023-04-29 11:26:51,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +46: [2023-04-29 11:26:51,261] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +18: [2023-04-29 11:26:51,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +18: [2023-04-29 11:26:51,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +18: [2023-04-29 11:26:51,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +40: [2023-04-29 11:26:51,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +26: [2023-04-29 11:26:51,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +26: [2023-04-29 11:26:51,263] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +49: [2023-04-29 11:26:51,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +40: [2023-04-29 11:26:51,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +54: [2023-04-29 11:26:51,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 7: [2023-04-29 11:26:51,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +54: [2023-04-29 11:26:51,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 11:26:51,265] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +54: [2023-04-29 11:26:51,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +26: [2023-04-29 11:26:51,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +13: [2023-04-29 11:26:51,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +40: [2023-04-29 11:26:51,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +48: [2023-04-29 11:26:51,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +30: [2023-04-29 11:26:51,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +36: [2023-04-29 11:26:51,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +40: [2023-04-29 11:26:51,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 7: [2023-04-29 11:26:51,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +35: [2023-04-29 11:26:51,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +30: [2023-04-29 11:26:51,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +30: [2023-04-29 11:26:51,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +48: [2023-04-29 11:26:51,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +55: [2023-04-29 11:26:51,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +55: [2023-04-29 11:26:51,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +30: [2023-04-29 11:26:51,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +35: [2023-04-29 11:26:51,272] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +55: [2023-04-29 11:26:51,273] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +26: [2023-04-29 11:26:51,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +26: [2023-04-29 11:26:51,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +55: [2023-04-29 11:26:51,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +36: [2023-04-29 11:26:51,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 11:26:51,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +36: [2023-04-29 11:26:51,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +48: [2023-04-29 11:26:51,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +13: [2023-04-29 11:26:51,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 6: [2023-04-29 11:26:51,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 6: [2023-04-29 11:26:51,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +18: [2023-04-29 11:26:51,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +48: [2023-04-29 11:26:51,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 11:26:51,275] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +36: [2023-04-29 11:26:51,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 11:26:51,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 11:26:51,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +55: [2023-04-29 11:26:51,276] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +11: [2023-04-29 11:26:51,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +30: [2023-04-29 11:26:51,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +63: [2023-04-29 11:26:51,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. + 6: [2023-04-29 11:26:51,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +63: [2023-04-29 11:26:51,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +63: [2023-04-29 11:26:51,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +63: [2023-04-29 11:26:51,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +55: [2023-04-29 11:26:51,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +48: [2023-04-29 11:26:51,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +55: [2023-04-29 11:26:51,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +55: [2023-04-29 11:26:51,278] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +48: [2023-04-29 11:26:51,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 11:26:51,279] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +48: [2023-04-29 11:26:51,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +13: [2023-04-29 11:26:51,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +36: [2023-04-29 11:26:51,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 7: [2023-04-29 11:26:51,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +11: [2023-04-29 11:26:51,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +26: [2023-04-29 11:26:51,281] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +36: [2023-04-29 11:26:51,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +36: [2023-04-29 11:26:51,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +36: [2023-04-29 11:26:51,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 11:26:51,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +48: [2023-04-29 11:26:51,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 11:26:51,283] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +48: [2023-04-29 11:26:51,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +36: [2023-04-29 11:26:51,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +49: [2023-04-29 11:26:51,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +49: [2023-04-29 11:26:51,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +36: [2023-04-29 11:26:51,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +13: [2023-04-29 11:26:51,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +36: [2023-04-29 11:26:51,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +36: [2023-04-29 11:26:51,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +36: [2023-04-29 11:26:51,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +36: [2023-04-29 11:26:51,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 7: [2023-04-29 11:26:51,286] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +36: [2023-04-29 11:26:51,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +59: [2023-04-29 11:26:51,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +36: [2023-04-29 11:26:51,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 7: [2023-04-29 11:26:51,286] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +62: [2023-04-29 11:26:51,287] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +49: [2023-04-29 11:26:51,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +49: [2023-04-29 11:26:51,288] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +59: [2023-04-29 11:26:51,289] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +30: [2023-04-29 11:26:51,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +30: [2023-04-29 11:26:51,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +30: [2023-04-29 11:26:51,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 7: [2023-04-29 11:26:51,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +62: [2023-04-29 11:26:51,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +49: [2023-04-29 11:26:51,292] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +49: [2023-04-29 11:26:51,292] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +24: [2023-04-29 11:26:51,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +24: [2023-04-29 11:26:51,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +49: [2023-04-29 11:26:51,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +24: [2023-04-29 11:26:51,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +24: [2023-04-29 11:26:51,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +62: [2023-04-29 11:26:51,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +18: [2023-04-29 11:26:51,295] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +45: [2023-04-29 11:26:51,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 11:26:51,295] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 11:26:51,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 11:26:51,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +18: [2023-04-29 11:26:51,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +18: [2023-04-29 11:26:51,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +18: [2023-04-29 11:26:51,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +30: [2023-04-29 11:26:51,296] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 7: [2023-04-29 11:26:51,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_00-model_states.pt. +11: [2023-04-29 11:26:51,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +24: [2023-04-29 11:26:51,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +24: [2023-04-29 11:26:51,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +62: [2023-04-29 11:26:51,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +24: [2023-04-29 11:26:51,298] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +62: [2023-04-29 11:26:51,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... + 8: [2023-04-29 11:26:51,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +24: [2023-04-29 11:26:51,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 8: [2023-04-29 11:26:51,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 8: [2023-04-29 11:26:51,299] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 8: [2023-04-29 11:26:51,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +54: [2023-04-29 11:26:51,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_90_mp_rank_02_optim_states.pt... +54: [2023-04-29 11:26:51,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_88_mp_rank_02_optim_states.pt... +54: [2023-04-29 11:26:51,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_89_mp_rank_02_optim_states.pt... +45: [2023-04-29 11:26:51,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +54: [2023-04-29 11:26:51,300] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_91_mp_rank_02_optim_states.pt... +45: [2023-04-29 11:26:51,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +45: [2023-04-29 11:26:51,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +62: [2023-04-29 11:26:51,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +59: [2023-04-29 11:26:51,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +59: [2023-04-29 11:26:51,300] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +62: [2023-04-29 11:26:51,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +45: [2023-04-29 11:26:51,303] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 7: [2023-04-29 11:26:51,304] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt... +11: [2023-04-29 11:26:51,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +11: [2023-04-29 11:26:51,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +27: [2023-04-29 11:26:51,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 11:26:51,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 2: [2023-04-29 11:26:51,306] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt. + 2: [2023-04-29 11:26:51,306] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 16 +11: [2023-04-29 11:26:51,305] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +59: [2023-04-29 11:26:51,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +59: [2023-04-29 11:26:51,306] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +62: [2023-04-29 11:26:51,307] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... + 0: [2023-04-29 11:26:51,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 11:26:51,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 0: [2023-04-29 11:26:51,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +46: [2023-04-29 11:26:51,308] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +29: [2023-04-29 11:26:51,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +29: [2023-04-29 11:26:51,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +29: [2023-04-29 11:26:51,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +38: [2023-04-29 11:26:51,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +29: [2023-04-29 11:26:51,310] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +63: [2023-04-29 11:26:51,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +63: [2023-04-29 11:26:51,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +63: [2023-04-29 11:26:51,312] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +59: [2023-04-29 11:26:51,311] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +51: [2023-04-29 11:26:51,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +34: [2023-04-29 11:26:51,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +34: [2023-04-29 11:26:51,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +22: [2023-04-29 11:26:51,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +22: [2023-04-29 11:26:51,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 3: [2023-04-29 11:26:51,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +46: [2023-04-29 11:26:51,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +22: [2023-04-29 11:26:51,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +58: [2023-04-29 11:26:51,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_104_mp_rank_02_optim_states.pt... +58: [2023-04-29 11:26:51,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_106_mp_rank_02_optim_states.pt... +58: [2023-04-29 11:26:51,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_107_mp_rank_02_optim_states.pt... +58: [2023-04-29 11:26:51,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_105_mp_rank_02_optim_states.pt... +22: [2023-04-29 11:26:51,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +11: [2023-04-29 11:26:51,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +11: [2023-04-29 11:26:51,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +34: [2023-04-29 11:26:51,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +63: [2023-04-29 11:26:51,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +29: [2023-04-29 11:26:51,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +29: [2023-04-29 11:26:51,314] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +34: [2023-04-29 11:26:51,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 0: [2023-04-29 11:26:51,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 0: [2023-04-29 11:26:51,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +38: [2023-04-29 11:26:51,315] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +51: [2023-04-29 11:26:51,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +59: [2023-04-29 11:26:51,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +29: [2023-04-29 11:26:51,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +49: [2023-04-29 11:26:51,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +29: [2023-04-29 11:26:51,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +49: [2023-04-29 11:26:51,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +49: [2023-04-29 11:26:51,317] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +49: [2023-04-29 11:26:51,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +51: [2023-04-29 11:26:51,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +59: [2023-04-29 11:26:51,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +49: [2023-04-29 11:26:51,318] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +14: [2023-04-29 11:26:51,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +14: [2023-04-29 11:26:51,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +49: [2023-04-29 11:26:51,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +49: [2023-04-29 11:26:51,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +49: [2023-04-29 11:26:51,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 3: [2023-04-29 11:26:51,319] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +22: [2023-04-29 11:26:51,319] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +34: [2023-04-29 11:26:51,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +51: [2023-04-29 11:26:51,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +38: [2023-04-29 11:26:51,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +54: [2023-04-29 11:26:51,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +22: [2023-04-29 11:26:51,320] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +22: [2023-04-29 11:26:51,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +34: [2023-04-29 11:26:51,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +46: [2023-04-29 11:26:51,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +34: [2023-04-29 11:26:51,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +51: [2023-04-29 11:26:51,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +30: [2023-04-29 11:26:51,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +22: [2023-04-29 11:26:51,321] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +55: [2023-04-29 11:26:51,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +55: [2023-04-29 11:26:51,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +51: [2023-04-29 11:26:51,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +34: [2023-04-29 11:26:51,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +55: [2023-04-29 11:26:51,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +49: [2023-04-29 11:26:51,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +40: [2023-04-29 11:26:51,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +30: [2023-04-29 11:26:51,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +38: [2023-04-29 11:26:51,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +38: [2023-04-29 11:26:51,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +30: [2023-04-29 11:26:51,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +49: [2023-04-29 11:26:51,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +49: [2023-04-29 11:26:51,322] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +55: [2023-04-29 11:26:51,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +49: [2023-04-29 11:26:51,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +14: [2023-04-29 11:26:51,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +14: [2023-04-29 11:26:51,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +59: [2023-04-29 11:26:51,324] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 11:26:51,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +41: [2023-04-29 11:26:51,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +41: [2023-04-29 11:26:51,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +46: [2023-04-29 11:26:51,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +54: [2023-04-29 11:26:51,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +41: [2023-04-29 11:26:51,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +46: [2023-04-29 11:26:51,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +59: [2023-04-29 11:26:51,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +14: [2023-04-29 11:26:51,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +54: [2023-04-29 11:26:51,326] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +38: [2023-04-29 11:26:51,326] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +14: [2023-04-29 11:26:51,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +27: [2023-04-29 11:26:51,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +27: [2023-04-29 11:26:51,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +51: [2023-04-29 11:26:51,327] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +27: [2023-04-29 11:26:51,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 8: [2023-04-29 11:26:51,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +38: [2023-04-29 11:26:51,328] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +59: [2023-04-29 11:26:51,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +37: [2023-04-29 11:26:51,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +37: [2023-04-29 11:26:51,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +38: [2023-04-29 11:26:51,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +14: [2023-04-29 11:26:51,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +51: [2023-04-29 11:26:51,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... + 8: [2023-04-29 11:26:51,329] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 8: [2023-04-29 11:26:51,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 8: [2023-04-29 11:26:51,330] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +14: [2023-04-29 11:26:51,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +46: [2023-04-29 11:26:51,331] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +54: [2023-04-29 11:26:51,332] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +37: [2023-04-29 11:26:51,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +37: [2023-04-29 11:26:51,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +40: [2023-04-29 11:26:51,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +12: [2023-04-29 11:26:51,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +12: [2023-04-29 11:26:51,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +12: [2023-04-29 11:26:51,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +36: [2023-04-29 11:26:51,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_18_mp_rank_02_optim_states.pt... +36: [2023-04-29 11:26:51,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_17_mp_rank_02_optim_states.pt... +36: [2023-04-29 11:26:51,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_16_mp_rank_02_optim_states.pt... +36: [2023-04-29 11:26:51,333] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_19_mp_rank_02_optim_states.pt... +40: [2023-04-29 11:26:51,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +12: [2023-04-29 11:26:51,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +54: [2023-04-29 11:26:51,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +54: [2023-04-29 11:26:51,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +40: [2023-04-29 11:26:51,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +30: [2023-04-29 11:26:51,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +48: [2023-04-29 11:26:51,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_66_mp_rank_02_optim_states.pt... +48: [2023-04-29 11:26:51,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_65_mp_rank_02_optim_states.pt... +48: [2023-04-29 11:26:51,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_67_mp_rank_02_optim_states.pt... +48: [2023-04-29 11:26:51,334] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_64_mp_rank_02_optim_states.pt... +37: [2023-04-29 11:26:51,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +37: [2023-04-29 11:26:51,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +25: [2023-04-29 11:26:51,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +25: [2023-04-29 11:26:51,337] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +46: [2023-04-29 11:26:51,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +48: [2023-04-29 11:26:51,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +48: [2023-04-29 11:26:51,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +30: [2023-04-29 11:26:51,339] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +48: [2023-04-29 11:26:51,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +48: [2023-04-29 11:26:51,339] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. + 0: > overriding learning rate value to 0.0002 + 0: > overriding minimum learning rate value to 2e-05 + 0: > overriding warmup iterations value to 0 + 0: > overriding total number of iterations value to 1 + 0: > overriding decay style value to cosine +12: [2023-04-29 11:26:51,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +56: [2023-04-29 11:26:51,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +56: [2023-04-29 11:26:51,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +56: [2023-04-29 11:26:51,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +12: [2023-04-29 11:26:51,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +54: [2023-04-29 11:26:51,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +37: [2023-04-29 11:26:51,340] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +54: [2023-04-29 11:26:51,341] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +37: [2023-04-29 11:26:51,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +37: [2023-04-29 11:26:51,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +12: [2023-04-29 11:26:51,341] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +56: [2023-04-29 11:26:51,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +30: [2023-04-29 11:26:51,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +12: [2023-04-29 11:26:51,342] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +19: [2023-04-29 11:26:51,343] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt. +37: [2023-04-29 11:26:51,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +19: [2023-04-29 11:26:51,343] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 152 +26: [2023-04-29 11:26:51,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +26: [2023-04-29 11:26:51,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +23: [2023-04-29 11:26:51,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +23: [2023-04-29 11:26:51,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +46: [2023-04-29 11:26:51,344] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +40: [2023-04-29 11:26:51,345] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +23: [2023-04-29 11:26:51,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +23: [2023-04-29 11:26:51,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +30: [2023-04-29 11:26:51,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +25: [2023-04-29 11:26:51,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +25: [2023-04-29 11:26:51,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +55: [2023-04-29 11:26:51,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +12: [2023-04-29 11:26:51,346] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +26: [2023-04-29 11:26:51,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +20: [2023-04-29 11:26:51,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +20: [2023-04-29 11:26:51,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,346] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +26: [2023-04-29 11:26:51,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +12: [2023-04-29 11:26:51,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +12: [2023-04-29 11:26:51,347] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +34: [2023-04-29 11:26:51,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +34: [2023-04-29 11:26:51,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +30: [2023-04-29 11:26:51,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +59: [2023-04-29 11:26:51,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 5: [2023-04-29 11:26:51,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +12: [2023-04-29 11:26:51,348] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +46: [2023-04-29 11:26:51,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +46: [2023-04-29 11:26:51,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +40: [2023-04-29 11:26:51,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +40: [2023-04-29 11:26:51,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +46: [2023-04-29 11:26:51,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +37: [2023-04-29 11:26:51,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +37: [2023-04-29 11:26:51,349] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +46: [2023-04-29 11:26:51,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +19: [2023-04-29 11:26:51,349] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 152 +40: [2023-04-29 11:26:51,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +15: [2023-04-29 11:26:51,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +15: [2023-04-29 11:26:51,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +15: [2023-04-29 11:26:51,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 1: [2023-04-29 11:26:51,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 1: [2023-04-29 11:26:51,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 1: [2023-04-29 11:26:51,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 0: [2023-04-29 11:26:51,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 6: [2023-04-29 11:26:51,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... + 0: [2023-04-29 11:26:51,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 0: [2023-04-29 11:26:51,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +20: [2023-04-29 11:26:51,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 1: [2023-04-29 11:26:51,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +15: [2023-04-29 11:26:51,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 0: [2023-04-29 11:26:51,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +55: [2023-04-29 11:26:51,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +20: [2023-04-29 11:26:51,350] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +26: [2023-04-29 11:26:51,350] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +30: [2023-04-29 11:26:51,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +26: [2023-04-29 11:26:51,351] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +15: [2023-04-29 11:26:51,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +15: [2023-04-29 11:26:51,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +15: [2023-04-29 11:26:51,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +15: [2023-04-29 11:26:51,351] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +26: [2023-04-29 11:26:51,352] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +59: [2023-04-29 11:26:51,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +59: [2023-04-29 11:26:51,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 6: [2023-04-29 11:26:51,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +26: [2023-04-29 11:26:51,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +59: [2023-04-29 11:26:51,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +55: [2023-04-29 11:26:51,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +20: [2023-04-29 11:26:51,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +20: [2023-04-29 11:26:51,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +46: [2023-04-29 11:26:51,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 5: [2023-04-29 11:26:51,353] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +46: [2023-04-29 11:26:51,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +18: [2023-04-29 11:26:51,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,354] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +46: [2023-04-29 11:26:51,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +20: [2023-04-29 11:26:51,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +46: [2023-04-29 11:26:51,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +41: [2023-04-29 11:26:51,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +41: [2023-04-29 11:26:51,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +20: [2023-04-29 11:26:51,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +41: [2023-04-29 11:26:51,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +10: [2023-04-29 11:26:51,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +10: [2023-04-29 11:26:51,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +10: [2023-04-29 11:26:51,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +34: [2023-04-29 11:26:51,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +18: [2023-04-29 11:26:51,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +34: [2023-04-29 11:26:51,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +10: [2023-04-29 11:26:51,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 6: [2023-04-29 11:26:51,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +24: [2023-04-29 11:26:51,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +15: [2023-04-29 11:26:51,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +15: [2023-04-29 11:26:51,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +12: [2023-04-29 11:26:51,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +25: [2023-04-29 11:26:51,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +25: [2023-04-29 11:26:51,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +41: [2023-04-29 11:26:51,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +25: [2023-04-29 11:26:51,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +15: [2023-04-29 11:26:51,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +15: [2023-04-29 11:26:51,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +55: [2023-04-29 11:26:51,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +55: [2023-04-29 11:26:51,359] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 2: [2023-04-29 11:26:51,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt. + 2: [2023-04-29 11:26:51,360] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 20 +18: [2023-04-29 11:26:51,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +17: [2023-04-29 11:26:51,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +17: [2023-04-29 11:26:51,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +57: [2023-04-29 11:26:51,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +57: [2023-04-29 11:26:51,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +18: [2023-04-29 11:26:51,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... + 5: [2023-04-29 11:26:51,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +55: [2023-04-29 11:26:51,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +25: [2023-04-29 11:26:51,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +61: [2023-04-29 11:26:51,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +61: [2023-04-29 11:26:51,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +61: [2023-04-29 11:26:51,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +48: [2023-04-29 11:26:51,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +40: [2023-04-29 11:26:51,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 5: [2023-04-29 11:26:51,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +61: [2023-04-29 11:26:51,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +59: [2023-04-29 11:26:51,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +25: [2023-04-29 11:26:51,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +40: [2023-04-29 11:26:51,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +40: [2023-04-29 11:26:51,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +24: [2023-04-29 11:26:51,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +24: [2023-04-29 11:26:51,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +12: [2023-04-29 11:26:51,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +40: [2023-04-29 11:26:51,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +59: [2023-04-29 11:26:51,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +40: [2023-04-29 11:26:51,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +59: [2023-04-29 11:26:51,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +17: [2023-04-29 11:26:51,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +40: [2023-04-29 11:26:51,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +40: [2023-04-29 11:26:51,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +59: [2023-04-29 11:26:51,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +37: [2023-04-29 11:26:51,363] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +17: [2023-04-29 11:26:51,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +40: [2023-04-29 11:26:51,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +25: [2023-04-29 11:26:51,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +45: [2023-04-29 11:26:51,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +12: [2023-04-29 11:26:51,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +12: [2023-04-29 11:26:51,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +25: [2023-04-29 11:26:51,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +59: [2023-04-29 11:26:51,364] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +30: [2023-04-29 11:26:51,364] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +59: [2023-04-29 11:26:51,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +59: [2023-04-29 11:26:51,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +57: [2023-04-29 11:26:51,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +59: [2023-04-29 11:26:51,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +57: [2023-04-29 11:26:51,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +21: [2023-04-29 11:26:51,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +21: [2023-04-29 11:26:51,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +37: [2023-04-29 11:26:51,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +31: [2023-04-29 11:26:51,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +31: [2023-04-29 11:26:51,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 11:26:51,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +31: [2023-04-29 11:26:51,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +31: [2023-04-29 11:26:51,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +25: [2023-04-29 11:26:51,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +25: [2023-04-29 11:26:51,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +57: [2023-04-29 11:26:51,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +40: [2023-04-29 11:26:51,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +40: [2023-04-29 11:26:51,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +40: [2023-04-29 11:26:51,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +57: [2023-04-29 11:26:51,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +19: [2023-04-29 11:26:51,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt. +37: [2023-04-29 11:26:51,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +37: [2023-04-29 11:26:51,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +40: [2023-04-29 11:26:51,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +25: [2023-04-29 11:26:51,367] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +19: [2023-04-29 11:26:51,367] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 154 +59: [2023-04-29 11:26:51,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +59: [2023-04-29 11:26:51,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +59: [2023-04-29 11:26:51,368] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +21: [2023-04-29 11:26:51,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +59: [2023-04-29 11:26:51,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +55: [2023-04-29 11:26:51,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +55: [2023-04-29 11:26:51,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +21: [2023-04-29 11:26:51,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +55: [2023-04-29 11:26:51,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +48: [2023-04-29 11:26:51,369] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +45: [2023-04-29 11:26:51,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +31: [2023-04-29 11:26:51,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +31: [2023-04-29 11:26:51,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +31: [2023-04-29 11:26:51,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +30: [2023-04-29 11:26:51,370] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +31: [2023-04-29 11:26:51,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 8: [2023-04-29 11:26:51,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 11:26:51,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 8: [2023-04-29 11:26:51,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 8: [2023-04-29 11:26:51,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +56: [2023-04-29 11:26:51,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +48: [2023-04-29 11:26:51,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +21: [2023-04-29 11:26:51,371] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 8: [2023-04-29 11:26:51,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 11:26:51,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +31: [2023-04-29 11:26:51,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +31: [2023-04-29 11:26:51,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +48: [2023-04-29 11:26:51,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +57: [2023-04-29 11:26:51,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +23: [2023-04-29 11:26:51,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +24: [2023-04-29 11:26:51,372] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +21: [2023-04-29 11:26:51,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +31: [2023-04-29 11:26:51,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +25: [2023-04-29 11:26:51,372] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +29: [2023-04-29 11:26:51,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +55: [2023-04-29 11:26:51,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 11:26:51,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +55: [2023-04-29 11:26:51,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +23: [2023-04-29 11:26:51,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +57: [2023-04-29 11:26:51,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +31: [2023-04-29 11:26:51,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +23: [2023-04-29 11:26:51,373] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +55: [2023-04-29 11:26:51,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +21: [2023-04-29 11:26:51,374] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +45: [2023-04-29 11:26:51,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 11:26:51,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +19: [2023-04-29 11:26:51,375] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 154 + 1: [2023-04-29 11:26:51,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +49: [2023-04-29 11:26:51,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_70_mp_rank_02_optim_states.pt... +49: [2023-04-29 11:26:51,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_71_mp_rank_02_optim_states.pt... +49: [2023-04-29 11:26:51,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_69_mp_rank_02_optim_states.pt... + 3: [2023-04-29 11:26:51,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 3: [2023-04-29 11:26:51,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 3: [2023-04-29 11:26:51,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +21: [2023-04-29 11:26:51,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 9: [2023-04-29 11:26:51,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 9: [2023-04-29 11:26:51,375] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 3: [2023-04-29 11:26:51,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +49: [2023-04-29 11:26:51,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_68_mp_rank_02_optim_states.pt... +23: [2023-04-29 11:26:51,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +34: [2023-04-29 11:26:51,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +34: [2023-04-29 11:26:51,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +25: [2023-04-29 11:26:51,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 0: [2023-04-29 11:26:51,376] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 9: [2023-04-29 11:26:51,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +18: [2023-04-29 11:26:51,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +32: [2023-04-29 11:26:51,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +32: [2023-04-29 11:26:51,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. + 9: [2023-04-29 11:26:51,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +32: [2023-04-29 11:26:51,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. + 8: [2023-04-29 11:26:51,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 8: [2023-04-29 11:26:51,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 8: [2023-04-29 11:26:51,377] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +32: [2023-04-29 11:26:51,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +56: [2023-04-29 11:26:51,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +56: [2023-04-29 11:26:51,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +11: [2023-04-29 11:26:51,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt. + 1: [2023-04-29 11:26:51,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +11: [2023-04-29 11:26:51,379] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 94 +47: [2023-04-29 11:26:51,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +47: [2023-04-29 11:26:51,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +47: [2023-04-29 11:26:51,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 1: [2023-04-29 11:26:51,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 1: [2023-04-29 11:26:51,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 3: [2023-04-29 11:26:51,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt... + 3: [2023-04-29 11:26:51,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt... + 3: [2023-04-29 11:26:51,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt... + 3: [2023-04-29 11:26:51,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt... +22: [2023-04-29 11:26:51,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +47: [2023-04-29 11:26:51,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +10: [2023-04-29 11:26:51,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +55: [2023-04-29 11:26:51,381] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +55: [2023-04-29 11:26:51,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +55: [2023-04-29 11:26:51,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +15: [2023-04-29 11:26:51,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +63: [2023-04-29 11:26:51,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +55: [2023-04-29 11:26:51,382] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 8: [2023-04-29 11:26:51,382] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +15: [2023-04-29 11:26:51,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +63: [2023-04-29 11:26:51,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +63: [2023-04-29 11:26:51,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 11:26:51,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 11:26:51,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 11:26:51,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 11:26:51,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 0: [2023-04-29 11:26:51,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 0: [2023-04-29 11:26:51,384] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 0: [2023-04-29 11:26:51,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt... + 0: [2023-04-29 11:26:51,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt... + 0: [2023-04-29 11:26:51,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt... +47: [2023-04-29 11:26:51,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 0: [2023-04-29 11:26:51,385] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt... +47: [2023-04-29 11:26:51,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +22: [2023-04-29 11:26:51,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +17: [2023-04-29 11:26:51,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +15: [2023-04-29 11:26:51,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +15: [2023-04-29 11:26:51,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 0: [2023-04-29 11:26:51,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +17: [2023-04-29 11:26:51,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +17: [2023-04-29 11:26:51,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +14: [2023-04-29 11:26:51,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +14: [2023-04-29 11:26:51,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +14: [2023-04-29 11:26:51,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +61: [2023-04-29 11:26:51,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +11: [2023-04-29 11:26:51,388] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 94 +14: [2023-04-29 11:26:51,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +17: [2023-04-29 11:26:51,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +47: [2023-04-29 11:26:51,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +29: [2023-04-29 11:26:51,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +47: [2023-04-29 11:26:51,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +45: [2023-04-29 11:26:51,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +24: [2023-04-29 11:26:51,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +24: [2023-04-29 11:26:51,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +34: [2023-04-29 11:26:51,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +63: [2023-04-29 11:26:51,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +63: [2023-04-29 11:26:51,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +24: [2023-04-29 11:26:51,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +17: [2023-04-29 11:26:51,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +63: [2023-04-29 11:26:51,391] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +17: [2023-04-29 11:26:51,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +29: [2023-04-29 11:26:51,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +61: [2023-04-29 11:26:51,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +63: [2023-04-29 11:26:51,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +17: [2023-04-29 11:26:51,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +44: [2023-04-29 11:26:51,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +44: [2023-04-29 11:26:51,392] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +44: [2023-04-29 11:26:51,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +17: [2023-04-29 11:26:51,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +44: [2023-04-29 11:26:51,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +34: [2023-04-29 11:26:51,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +14: [2023-04-29 11:26:51,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +17: [2023-04-29 11:26:51,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +17: [2023-04-29 11:26:51,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +29: [2023-04-29 11:26:51,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 8: [2023-04-29 11:26:51,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +61: [2023-04-29 11:26:51,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +17: [2023-04-29 11:26:51,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +61: [2023-04-29 11:26:51,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +17: [2023-04-29 11:26:51,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +19: [2023-04-29 11:26:51,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +19: [2023-04-29 11:26:51,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +19: [2023-04-29 11:26:51,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +34: [2023-04-29 11:26:51,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 11:26:51,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +32: [2023-04-29 11:26:51,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +32: [2023-04-29 11:26:51,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +45: [2023-04-29 11:26:51,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +45: [2023-04-29 11:26:51,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +32: [2023-04-29 11:26:51,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +19: [2023-04-29 11:26:51,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +32: [2023-04-29 11:26:51,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +63: [2023-04-29 11:26:51,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +31: [2023-04-29 11:26:51,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 11:26:51,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt. +45: [2023-04-29 11:26:51,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +29: [2023-04-29 11:26:51,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +11: [2023-04-29 11:26:51,398] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 90 +29: [2023-04-29 11:26:51,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +45: [2023-04-29 11:26:51,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +45: [2023-04-29 11:26:51,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +29: [2023-04-29 11:26:51,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +10: [2023-04-29 11:26:51,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +10: [2023-04-29 11:26:51,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +10: [2023-04-29 11:26:51,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +45: [2023-04-29 11:26:51,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +45: [2023-04-29 11:26:51,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +29: [2023-04-29 11:26:51,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +45: [2023-04-29 11:26:51,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +24: [2023-04-29 11:26:51,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +32: [2023-04-29 11:26:51,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +22: [2023-04-29 11:26:51,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +22: [2023-04-29 11:26:51,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +29: [2023-04-29 11:26:51,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +31: [2023-04-29 11:26:51,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 8: [2023-04-29 11:26:51,401] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +14: [2023-04-29 11:26:51,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +60: [2023-04-29 11:26:51,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +60: [2023-04-29 11:26:51,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +60: [2023-04-29 11:26:51,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +60: [2023-04-29 11:26:51,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +10: [2023-04-29 11:26:51,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt. +10: [2023-04-29 11:26:51,403] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 86 +55: [2023-04-29 11:26:51,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +31: [2023-04-29 11:26:51,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +31: [2023-04-29 11:26:51,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +55: [2023-04-29 11:26:51,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +55: [2023-04-29 11:26:51,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +55: [2023-04-29 11:26:51,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +34: [2023-04-29 11:26:51,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +27: [2023-04-29 11:26:51,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt... +27: [2023-04-29 11:26:51,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt... +27: [2023-04-29 11:26:51,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt... +27: [2023-04-29 11:26:51,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt... +47: [2023-04-29 11:26:51,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +47: [2023-04-29 11:26:51,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. + 2: [2023-04-29 11:26:51,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt. +45: [2023-04-29 11:26:51,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. + 2: [2023-04-29 11:26:51,405] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 18 +45: [2023-04-29 11:26:51,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. + 9: [2023-04-29 11:26:51,406] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 11:26:51,406] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 90 +47: [2023-04-29 11:26:51,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +47: [2023-04-29 11:26:51,407] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +22: [2023-04-29 11:26:51,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 9: [2023-04-29 11:26:51,408] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +55: [2023-04-29 11:26:51,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +37: [2023-04-29 11:26:51,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 3: [2023-04-29 11:26:51,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +14: [2023-04-29 11:26:51,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +55: [2023-04-29 11:26:51,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +55: [2023-04-29 11:26:51,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +55: [2023-04-29 11:26:51,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 3: [2023-04-29 11:26:51,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 3: [2023-04-29 11:26:51,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +40: [2023-04-29 11:26:51,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_32_mp_rank_02_optim_states.pt... + 9: [2023-04-29 11:26:51,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +40: [2023-04-29 11:26:51,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_34_mp_rank_02_optim_states.pt... +40: [2023-04-29 11:26:51,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_35_mp_rank_02_optim_states.pt... +40: [2023-04-29 11:26:51,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_33_mp_rank_02_optim_states.pt... + 2: [2023-04-29 11:26:51,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt. + 2: [2023-04-29 11:26:51,411] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 22 +45: [2023-04-29 11:26:51,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +45: [2023-04-29 11:26:51,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +10: [2023-04-29 11:26:51,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt. +45: [2023-04-29 11:26:51,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +10: [2023-04-29 11:26:51,412] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 84 +45: [2023-04-29 11:26:51,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +45: [2023-04-29 11:26:51,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +45: [2023-04-29 11:26:51,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +45: [2023-04-29 11:26:51,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +14: [2023-04-29 11:26:51,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +45: [2023-04-29 11:26:51,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 3: [2023-04-29 11:26:51,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 9: [2023-04-29 11:26:51,412] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +28: [2023-04-29 11:26:51,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +28: [2023-04-29 11:26:51,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +28: [2023-04-29 11:26:51,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +28: [2023-04-29 11:26:51,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +22: [2023-04-29 11:26:51,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +32: [2023-04-29 11:26:51,414] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +50: [2023-04-29 11:26:51,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +50: [2023-04-29 11:26:51,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +50: [2023-04-29 11:26:51,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +50: [2023-04-29 11:26:51,416] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +14: [2023-04-29 11:26:51,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +14: [2023-04-29 11:26:51,416] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +52: [2023-04-29 11:26:51,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 11:26:51,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 11:26:51,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +14: [2023-04-29 11:26:51,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 1: [2023-04-29 11:26:51,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 1: [2023-04-29 11:26:51,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 1: [2023-04-29 11:26:51,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 1: [2023-04-29 11:26:51,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +29: [2023-04-29 11:26:51,419] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 5: [2023-04-29 11:26:51,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,418] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +50: [2023-04-29 11:26:51,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +26: [2023-04-29 11:26:51,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +26: [2023-04-29 11:26:51,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +50: [2023-04-29 11:26:51,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +26: [2023-04-29 11:26:51,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +48: [2023-04-29 11:26:51,419] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +20: [2023-04-29 11:26:51,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +32: [2023-04-29 11:26:51,420] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +20: [2023-04-29 11:26:51,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +20: [2023-04-29 11:26:51,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +52: [2023-04-29 11:26:51,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +20: [2023-04-29 11:26:51,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +58: [2023-04-29 11:26:51,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +58: [2023-04-29 11:26:51,420] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +58: [2023-04-29 11:26:51,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +44: [2023-04-29 11:26:51,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +52: [2023-04-29 11:26:51,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +50: [2023-04-29 11:26:51,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +58: [2023-04-29 11:26:51,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +14: [2023-04-29 11:26:51,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +50: [2023-04-29 11:26:51,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +12: [2023-04-29 11:26:51,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +12: [2023-04-29 11:26:51,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +12: [2023-04-29 11:26:51,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +41: [2023-04-29 11:26:51,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +26: [2023-04-29 11:26:51,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +34: [2023-04-29 11:26:51,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +50: [2023-04-29 11:26:51,422] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +29: [2023-04-29 11:26:51,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +50: [2023-04-29 11:26:51,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +48: [2023-04-29 11:26:51,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +44: [2023-04-29 11:26:51,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +19: [2023-04-29 11:26:51,423] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 1: [2023-04-29 11:26:51,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +29: [2023-04-29 11:26:51,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +52: [2023-04-29 11:26:51,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +44: [2023-04-29 11:26:51,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 1: [2023-04-29 11:26:51,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 1: [2023-04-29 11:26:51,424] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +52: [2023-04-29 11:26:51,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +19: [2023-04-29 11:26:51,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +41: [2023-04-29 11:26:51,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 11:26:51,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 11:26:51,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 1: [2023-04-29 11:26:51,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +41: [2023-04-29 11:26:51,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +19: [2023-04-29 11:26:51,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +55: [2023-04-29 11:26:51,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_93_mp_rank_02_optim_states.pt... +55: [2023-04-29 11:26:51,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_95_mp_rank_02_optim_states.pt... +55: [2023-04-29 11:26:51,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_92_mp_rank_02_optim_states.pt... +55: [2023-04-29 11:26:51,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_94_mp_rank_02_optim_states.pt... +52: [2023-04-29 11:26:51,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +20: [2023-04-29 11:26:51,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +12: [2023-04-29 11:26:51,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +41: [2023-04-29 11:26:51,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +34: [2023-04-29 11:26:51,426] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +20: [2023-04-29 11:26:51,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +20: [2023-04-29 11:26:51,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +44: [2023-04-29 11:26:51,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +41: [2023-04-29 11:26:51,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +52: [2023-04-29 11:26:51,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +34: [2023-04-29 11:26:51,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +46: [2023-04-29 11:26:51,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 11:26:51,427] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 8: [2023-04-29 11:26:51,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 8: [2023-04-29 11:26:51,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 8: [2023-04-29 11:26:51,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +46: [2023-04-29 11:26:51,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +40: [2023-04-29 11:26:51,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +40: [2023-04-29 11:26:51,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +40: [2023-04-29 11:26:51,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +40: [2023-04-29 11:26:51,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +25: [2023-04-29 11:26:51,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +14: [2023-04-29 11:26:51,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +45: [2023-04-29 11:26:51,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +19: [2023-04-29 11:26:51,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +25: [2023-04-29 11:26:51,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +41: [2023-04-29 11:26:51,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +50: [2023-04-29 11:26:51,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +41: [2023-04-29 11:26:51,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +47: [2023-04-29 11:26:51,429] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +37: [2023-04-29 11:26:51,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,430] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +29: [2023-04-29 11:26:51,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +50: [2023-04-29 11:26:51,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +41: [2023-04-29 11:26:51,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +41: [2023-04-29 11:26:51,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +29: [2023-04-29 11:26:51,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +60: [2023-04-29 11:26:51,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +34: [2023-04-29 11:26:51,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +34: [2023-04-29 11:26:51,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 11:26:51,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +34: [2023-04-29 11:26:51,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +41: [2023-04-29 11:26:51,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +22: [2023-04-29 11:26:51,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 7: [2023-04-29 11:26:51,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt. +47: [2023-04-29 11:26:51,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 7: [2023-04-29 11:26:51,433] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 62 +22: [2023-04-29 11:26:51,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +15: [2023-04-29 11:26:51,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +46: [2023-04-29 11:26:51,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +25: [2023-04-29 11:26:51,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +25: [2023-04-29 11:26:51,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +55: [2023-04-29 11:26:51,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +12: [2023-04-29 11:26:51,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +12: [2023-04-29 11:26:51,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +60: [2023-04-29 11:26:51,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +60: [2023-04-29 11:26:51,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +53: [2023-04-29 11:26:51,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +53: [2023-04-29 11:26:51,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +53: [2023-04-29 11:26:51,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +53: [2023-04-29 11:26:51,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +15: [2023-04-29 11:26:51,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +41: [2023-04-29 11:26:51,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... + 8: [2023-04-29 11:26:51,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +41: [2023-04-29 11:26:51,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +57: [2023-04-29 11:26:51,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 8: [2023-04-29 11:26:51,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +47: [2023-04-29 11:26:51,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +34: [2023-04-29 11:26:51,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 8: [2023-04-29 11:26:51,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +14: [2023-04-29 11:26:51,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +41: [2023-04-29 11:26:51,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +37: [2023-04-29 11:26:51,436] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +34: [2023-04-29 11:26:51,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +34: [2023-04-29 11:26:51,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +29: [2023-04-29 11:26:51,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +34: [2023-04-29 11:26:51,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +11: [2023-04-29 11:26:51,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt. +11: [2023-04-29 11:26:51,438] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 88 +20: [2023-04-29 11:26:51,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +59: [2023-04-29 11:26:51,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_110_mp_rank_02_optim_states.pt... +59: [2023-04-29 11:26:51,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_111_mp_rank_02_optim_states.pt... +59: [2023-04-29 11:26:51,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_109_mp_rank_02_optim_states.pt... +59: [2023-04-29 11:26:51,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_108_mp_rank_02_optim_states.pt... +29: [2023-04-29 11:26:51,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +25: [2023-04-29 11:26:51,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +25: [2023-04-29 11:26:51,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... + 4: [2023-04-29 11:26:51,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 4: [2023-04-29 11:26:51,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 4: [2023-04-29 11:26:51,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +49: [2023-04-29 11:26:51,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +49: [2023-04-29 11:26:51,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +49: [2023-04-29 11:26:51,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +12: [2023-04-29 11:26:51,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +28: [2023-04-29 11:26:51,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +49: [2023-04-29 11:26:51,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +57: [2023-04-29 11:26:51,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +46: [2023-04-29 11:26:51,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +60: [2023-04-29 11:26:51,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +45: [2023-04-29 11:26:51,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +45: [2023-04-29 11:26:51,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +14: [2023-04-29 11:26:51,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +53: [2023-04-29 11:26:51,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +55: [2023-04-29 11:26:51,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +53: [2023-04-29 11:26:51,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 7: [2023-04-29 11:26:51,440] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 62 +57: [2023-04-29 11:26:51,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +47: [2023-04-29 11:26:51,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +28: [2023-04-29 11:26:51,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +37: [2023-04-29 11:26:51,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +53: [2023-04-29 11:26:51,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 1: [2023-04-29 11:26:51,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +56: [2023-04-29 11:26:51,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +53: [2023-04-29 11:26:51,440] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +56: [2023-04-29 11:26:51,440] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +37: [2023-04-29 11:26:51,441] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 4: [2023-04-29 11:26:51,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +57: [2023-04-29 11:26:51,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +48: [2023-04-29 11:26:51,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +37: [2023-04-29 11:26:51,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +21: [2023-04-29 11:26:51,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +21: [2023-04-29 11:26:51,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +21: [2023-04-29 11:26:51,441] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +37: [2023-04-29 11:26:51,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +37: [2023-04-29 11:26:51,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 0: [2023-04-29 11:26:51,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +48: [2023-04-29 11:26:51,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +25: [2023-04-29 11:26:51,443] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +25: [2023-04-29 11:26:51,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +28: [2023-04-29 11:26:51,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +31: [2023-04-29 11:26:51,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +37: [2023-04-29 11:26:51,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +12: [2023-04-29 11:26:51,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +12: [2023-04-29 11:26:51,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +50: [2023-04-29 11:26:51,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +50: [2023-04-29 11:26:51,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 1: [2023-04-29 11:26:51,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +56: [2023-04-29 11:26:51,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 5: [2023-04-29 11:26:51,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +12: [2023-04-29 11:26:51,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +56: [2023-04-29 11:26:51,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +31: [2023-04-29 11:26:51,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +31: [2023-04-29 11:26:51,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +50: [2023-04-29 11:26:51,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +56: [2023-04-29 11:26:51,446] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +28: [2023-04-29 11:26:51,447] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +21: [2023-04-29 11:26:51,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +25: [2023-04-29 11:26:51,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +28: [2023-04-29 11:26:51,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +11: [2023-04-29 11:26:51,447] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 88 +28: [2023-04-29 11:26:51,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +42: [2023-04-29 11:26:51,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +42: [2023-04-29 11:26:51,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +10: [2023-04-29 11:26:51,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +48: [2023-04-29 11:26:51,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +28: [2023-04-29 11:26:51,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +48: [2023-04-29 11:26:51,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 0: [2023-04-29 11:26:51,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +28: [2023-04-29 11:26:51,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 8: [2023-04-29 11:26:51,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +12: [2023-04-29 11:26:51,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +23: [2023-04-29 11:26:51,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +23: [2023-04-29 11:26:51,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +26: [2023-04-29 11:26:51,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +20: [2023-04-29 11:26:51,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +20: [2023-04-29 11:26:51,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +50: [2023-04-29 11:26:51,449] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +42: [2023-04-29 11:26:51,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +48: [2023-04-29 11:26:51,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +26: [2023-04-29 11:26:51,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 11:26:51,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +21: [2023-04-29 11:26:51,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +56: [2023-04-29 11:26:51,450] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +10: [2023-04-29 11:26:51,450] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt. +10: [2023-04-29 11:26:51,450] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 82 +42: [2023-04-29 11:26:51,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +26: [2023-04-29 11:26:51,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +14: [2023-04-29 11:26:51,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +37: [2023-04-29 11:26:51,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +58: [2023-04-29 11:26:51,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +58: [2023-04-29 11:26:51,451] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 0: [2023-04-29 11:26:51,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +34: [2023-04-29 11:26:51,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 1: [2023-04-29 11:26:51,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 1: [2023-04-29 11:26:51,451] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +12: [2023-04-29 11:26:51,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +28: [2023-04-29 11:26:51,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +12: [2023-04-29 11:26:51,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +58: [2023-04-29 11:26:51,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +61: [2023-04-29 11:26:51,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +25: [2023-04-29 11:26:51,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +58: [2023-04-29 11:26:51,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +23: [2023-04-29 11:26:51,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +28: [2023-04-29 11:26:51,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +23: [2023-04-29 11:26:51,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +20: [2023-04-29 11:26:51,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +12: [2023-04-29 11:26:51,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +28: [2023-04-29 11:26:51,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +10: [2023-04-29 11:26:51,454] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +21: [2023-04-29 11:26:51,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +46: [2023-04-29 11:26:51,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +48: [2023-04-29 11:26:51,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +26: [2023-04-29 11:26:51,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +55: [2023-04-29 11:26:51,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +55: [2023-04-29 11:26:51,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +56: [2023-04-29 11:26:51,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +53: [2023-04-29 11:26:51,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +53: [2023-04-29 11:26:51,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +53: [2023-04-29 11:26:51,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +53: [2023-04-29 11:26:51,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +42: [2023-04-29 11:26:51,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +42: [2023-04-29 11:26:51,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +23: [2023-04-29 11:26:51,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +23: [2023-04-29 11:26:51,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +20: [2023-04-29 11:26:51,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +42: [2023-04-29 11:26:51,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +21: [2023-04-29 11:26:51,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +34: [2023-04-29 11:26:51,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +25: [2023-04-29 11:26:51,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +37: [2023-04-29 11:26:51,456] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 0: [2023-04-29 11:26:51,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +61: [2023-04-29 11:26:51,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +55: [2023-04-29 11:26:51,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +20: [2023-04-29 11:26:51,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +61: [2023-04-29 11:26:51,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +61: [2023-04-29 11:26:51,457] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +28: [2023-04-29 11:26:51,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +61: [2023-04-29 11:26:51,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +61: [2023-04-29 11:26:51,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +61: [2023-04-29 11:26:51,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 1: [2023-04-29 11:26:51,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +42: [2023-04-29 11:26:51,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +42: [2023-04-29 11:26:51,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +37: [2023-04-29 11:26:51,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +42: [2023-04-29 11:26:51,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +34: [2023-04-29 11:26:51,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +37: [2023-04-29 11:26:51,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 1: [2023-04-29 11:26:51,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +17: [2023-04-29 11:26:51,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +37: [2023-04-29 11:26:51,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 1: [2023-04-29 11:26:51,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +34: [2023-04-29 11:26:51,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +37: [2023-04-29 11:26:51,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +46: [2023-04-29 11:26:51,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +23: [2023-04-29 11:26:51,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +37: [2023-04-29 11:26:51,459] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +34: [2023-04-29 11:26:51,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +34: [2023-04-29 11:26:51,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +46: [2023-04-29 11:26:51,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 9: [2023-04-29 11:26:51,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +34: [2023-04-29 11:26:51,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +23: [2023-04-29 11:26:51,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +31: [2023-04-29 11:26:51,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +42: [2023-04-29 11:26:51,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +15: [2023-04-29 11:26:51,460] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 2: [2023-04-29 11:26:51,461] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 16 +46: [2023-04-29 11:26:51,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +46: [2023-04-29 11:26:51,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +46: [2023-04-29 11:26:51,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +46: [2023-04-29 11:26:51,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +46: [2023-04-29 11:26:51,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +46: [2023-04-29 11:26:51,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +20: [2023-04-29 11:26:51,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +46: [2023-04-29 11:26:51,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +46: [2023-04-29 11:26:51,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 8: [2023-04-29 11:26:51,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 8: [2023-04-29 11:26:51,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +17: [2023-04-29 11:26:51,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +17: [2023-04-29 11:26:51,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +46: [2023-04-29 11:26:51,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +47: [2023-04-29 11:26:51,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +56: [2023-04-29 11:26:51,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +34: [2023-04-29 11:26:51,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +10: [2023-04-29 11:26:51,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt. +42: [2023-04-29 11:26:51,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +40: [2023-04-29 11:26:51,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +10: [2023-04-29 11:26:51,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +10: [2023-04-29 11:26:51,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +10: [2023-04-29 11:26:51,463] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 80 +57: [2023-04-29 11:26:51,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 0: [2023-04-29 11:26:51,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +17: [2023-04-29 11:26:51,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +40: [2023-04-29 11:26:51,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +17: [2023-04-29 11:26:51,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +17: [2023-04-29 11:26:51,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +34: [2023-04-29 11:26:51,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +34: [2023-04-29 11:26:51,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +15: [2023-04-29 11:26:51,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +40: [2023-04-29 11:26:51,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +40: [2023-04-29 11:26:51,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 5: [2023-04-29 11:26:51,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +34: [2023-04-29 11:26:51,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +45: [2023-04-29 11:26:51,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_54_mp_rank_02_optim_states.pt... +45: [2023-04-29 11:26:51,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_52_mp_rank_02_optim_states.pt... +45: [2023-04-29 11:26:51,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_55_mp_rank_02_optim_states.pt... +45: [2023-04-29 11:26:51,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_53_mp_rank_02_optim_states.pt... +15: [2023-04-29 11:26:51,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +61: [2023-04-29 11:26:51,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +10: [2023-04-29 11:26:51,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +25: [2023-04-29 11:26:51,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... + 5: [2023-04-29 11:26:51,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +12: [2023-04-29 11:26:51,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +12: [2023-04-29 11:26:51,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +15: [2023-04-29 11:26:51,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +20: [2023-04-29 11:26:51,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +55: [2023-04-29 11:26:51,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +34: [2023-04-29 11:26:51,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +61: [2023-04-29 11:26:51,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +61: [2023-04-29 11:26:51,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +17: [2023-04-29 11:26:51,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... + 7: [2023-04-29 11:26:51,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt. +55: [2023-04-29 11:26:51,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +61: [2023-04-29 11:26:51,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 7: [2023-04-29 11:26:51,466] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 56 +32: [2023-04-29 11:26:51,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +61: [2023-04-29 11:26:51,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 1: [2023-04-29 11:26:51,466] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +17: [2023-04-29 11:26:51,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 0: [2023-04-29 11:26:51,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +15: [2023-04-29 11:26:51,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +31: [2023-04-29 11:26:51,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... + 5: [2023-04-29 11:26:51,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 4: [2023-04-29 11:26:51,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 5: [2023-04-29 11:26:51,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +49: [2023-04-29 11:26:51,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +49: [2023-04-29 11:26:51,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +17: [2023-04-29 11:26:51,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +37: [2023-04-29 11:26:51,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +49: [2023-04-29 11:26:51,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +37: [2023-04-29 11:26:51,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 2: [2023-04-29 11:26:51,468] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 18 +31: [2023-04-29 11:26:51,468] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 4: [2023-04-29 11:26:51,468] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +17: [2023-04-29 11:26:51,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... + 4: [2023-04-29 11:26:51,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +55: [2023-04-29 11:26:51,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +57: [2023-04-29 11:26:51,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +57: [2023-04-29 11:26:51,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +10: [2023-04-29 11:26:51,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +15: [2023-04-29 11:26:51,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +47: [2023-04-29 11:26:51,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +47: [2023-04-29 11:26:51,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +57: [2023-04-29 11:26:51,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +17: [2023-04-29 11:26:51,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... + 0: [2023-04-29 11:26:51,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +20: [2023-04-29 11:26:51,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 9: [2023-04-29 11:26:51,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +57: [2023-04-29 11:26:51,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +47: [2023-04-29 11:26:51,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +10: [2023-04-29 11:26:51,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +46: [2023-04-29 11:26:51,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +57: [2023-04-29 11:26:51,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +57: [2023-04-29 11:26:51,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +46: [2023-04-29 11:26:51,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 4: [2023-04-29 11:26:51,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +46: [2023-04-29 11:26:51,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +15: [2023-04-29 11:26:51,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +57: [2023-04-29 11:26:51,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +21: [2023-04-29 11:26:51,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +32: [2023-04-29 11:26:51,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +37: [2023-04-29 11:26:51,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +46: [2023-04-29 11:26:51,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +10: [2023-04-29 11:26:51,471] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +37: [2023-04-29 11:26:51,471] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +37: [2023-04-29 11:26:51,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +57: [2023-04-29 11:26:51,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +57: [2023-04-29 11:26:51,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +37: [2023-04-29 11:26:51,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +49: [2023-04-29 11:26:51,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +37: [2023-04-29 11:26:51,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +57: [2023-04-29 11:26:51,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +57: [2023-04-29 11:26:51,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +57: [2023-04-29 11:26:51,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +57: [2023-04-29 11:26:51,472] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +27: [2023-04-29 11:26:51,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +27: [2023-04-29 11:26:51,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +27: [2023-04-29 11:26:51,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +57: [2023-04-29 11:26:51,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +57: [2023-04-29 11:26:51,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +61: [2023-04-29 11:26:51,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +61: [2023-04-29 11:26:51,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +15: [2023-04-29 11:26:51,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +27: [2023-04-29 11:26:51,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +17: [2023-04-29 11:26:51,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +21: [2023-04-29 11:26:51,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 0: [2023-04-29 11:26:51,473] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +31: [2023-04-29 11:26:51,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 7: [2023-04-29 11:26:51,474] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 56 +37: [2023-04-29 11:26:51,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +31: [2023-04-29 11:26:51,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +37: [2023-04-29 11:26:51,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +37: [2023-04-29 11:26:51,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +31: [2023-04-29 11:26:51,475] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 3: [2023-04-29 11:26:51,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +21: [2023-04-29 11:26:51,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +44: [2023-04-29 11:26:51,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 11:26:51,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 11:26:51,475] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +37: [2023-04-29 11:26:51,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +44: [2023-04-29 11:26:51,476] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 8: [2023-04-29 11:26:51,476] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +37: [2023-04-29 11:26:51,477] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +19: [2023-04-29 11:26:51,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +24: [2023-04-29 11:26:51,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +24: [2023-04-29 11:26:51,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +31: [2023-04-29 11:26:51,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +15: [2023-04-29 11:26:51,478] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 3: [2023-04-29 11:26:51,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 9: [2023-04-29 11:26:51,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +24: [2023-04-29 11:26:51,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +15: [2023-04-29 11:26:51,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +63: [2023-04-29 11:26:51,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_127_mp_rank_02_optim_states.pt. +63: [2023-04-29 11:26:51,480] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 510 +21: [2023-04-29 11:26:51,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +61: [2023-04-29 11:26:51,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +61: [2023-04-29 11:26:51,480] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +24: [2023-04-29 11:26:51,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +19: [2023-04-29 11:26:51,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... + 3: [2023-04-29 11:26:51,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +44: [2023-04-29 11:26:51,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +44: [2023-04-29 11:26:51,481] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +53: [2023-04-29 11:26:51,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +44: [2023-04-29 11:26:51,482] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +36: [2023-04-29 11:26:51,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +36: [2023-04-29 11:26:51,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +36: [2023-04-29 11:26:51,482] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +21: [2023-04-29 11:26:51,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +44: [2023-04-29 11:26:51,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +36: [2023-04-29 11:26:51,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +57: [2023-04-29 11:26:51,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +57: [2023-04-29 11:26:51,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +14: [2023-04-29 11:26:51,483] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +21: [2023-04-29 11:26:51,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +21: [2023-04-29 11:26:51,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +52: [2023-04-29 11:26:51,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +31: [2023-04-29 11:26:51,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... + 9: [2023-04-29 11:26:51,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +52: [2023-04-29 11:26:51,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. + 3: [2023-04-29 11:26:51,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +53: [2023-04-29 11:26:51,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +34: [2023-04-29 11:26:51,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt... + 3: [2023-04-29 11:26:51,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... + 9: [2023-04-29 11:26:51,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 9: [2023-04-29 11:26:51,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +34: [2023-04-29 11:26:51,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt... +34: [2023-04-29 11:26:51,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_9_mp_rank_02_optim_states.pt... +34: [2023-04-29 11:26:51,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_8_mp_rank_02_optim_states.pt... +31: [2023-04-29 11:26:51,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +57: [2023-04-29 11:26:51,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +42: [2023-04-29 11:26:51,485] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 3: [2023-04-29 11:26:51,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +53: [2023-04-29 11:26:51,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +53: [2023-04-29 11:26:51,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +15: [2023-04-29 11:26:51,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +15: [2023-04-29 11:26:51,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +57: [2023-04-29 11:26:51,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +43: [2023-04-29 11:26:51,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_45_mp_rank_02_optim_states.pt. +14: [2023-04-29 11:26:51,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +52: [2023-04-29 11:26:51,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +43: [2023-04-29 11:26:51,489] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 346 +52: [2023-04-29 11:26:51,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. + 8: [2023-04-29 11:26:51,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 1: [2023-04-29 11:26:51,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +42: [2023-04-29 11:26:51,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +21: [2023-04-29 11:26:51,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +44: [2023-04-29 11:26:51,489] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +34: [2023-04-29 11:26:51,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +47: [2023-04-29 11:26:51,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +45: [2023-04-29 11:26:51,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 2: [2023-04-29 11:26:51,490] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 20 +42: [2023-04-29 11:26:51,490] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... + 2: [2023-04-29 11:26:51,490] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 22 +17: [2023-04-29 11:26:51,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +17: [2023-04-29 11:26:51,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 9: [2023-04-29 11:26:51,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +43: [2023-04-29 11:26:51,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_46_mp_rank_02_optim_states.pt. + 3: [2023-04-29 11:26:51,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +43: [2023-04-29 11:26:51,491] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 348 +31: [2023-04-29 11:26:51,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 9: [2023-04-29 11:26:51,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... + 3: [2023-04-29 11:26:51,492] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +52: [2023-04-29 11:26:51,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +14: [2023-04-29 11:26:51,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +31: [2023-04-29 11:26:51,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +11: [2023-04-29 11:26:51,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt. +60: [2023-04-29 11:26:51,493] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +11: [2023-04-29 11:26:51,493] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 92 + 8: [2023-04-29 11:26:51,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 8: [2023-04-29 11:26:51,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +17: [2023-04-29 11:26:51,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +18: [2023-04-29 11:26:51,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +18: [2023-04-29 11:26:51,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +18: [2023-04-29 11:26:51,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +18: [2023-04-29 11:26:51,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +45: [2023-04-29 11:26:51,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +13: [2023-04-29 11:26:51,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +13: [2023-04-29 11:26:51,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +19: [2023-04-29 11:26:51,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +47: [2023-04-29 11:26:51,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +34: [2023-04-29 11:26:51,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 5: [2023-04-29 11:26:51,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +47: [2023-04-29 11:26:51,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +44: [2023-04-29 11:26:51,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +52: [2023-04-29 11:26:51,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 11:26:51,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +44: [2023-04-29 11:26:51,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +42: [2023-04-29 11:26:51,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +14: [2023-04-29 11:26:51,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +19: [2023-04-29 11:26:51,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +37: [2023-04-29 11:26:51,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_21_mp_rank_02_optim_states.pt... +37: [2023-04-29 11:26:51,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_23_mp_rank_02_optim_states.pt... +37: [2023-04-29 11:26:51,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_20_mp_rank_02_optim_states.pt... +37: [2023-04-29 11:26:51,495] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_22_mp_rank_02_optim_states.pt... +47: [2023-04-29 11:26:51,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +43: [2023-04-29 11:26:51,496] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 346 + 5: [2023-04-29 11:26:51,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +15: [2023-04-29 11:26:51,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 1: [2023-04-29 11:26:51,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 1: [2023-04-29 11:26:51,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 1: [2023-04-29 11:26:51,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 11:26:51,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +13: [2023-04-29 11:26:51,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +22: [2023-04-29 11:26:51,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +22: [2023-04-29 11:26:51,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +45: [2023-04-29 11:26:51,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +28: [2023-04-29 11:26:51,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +29: [2023-04-29 11:26:51,497] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +34: [2023-04-29 11:26:51,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +60: [2023-04-29 11:26:51,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +31: [2023-04-29 11:26:51,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 5: [2023-04-29 11:26:51,498] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +41: [2023-04-29 11:26:51,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 11:26:51,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +22: [2023-04-29 11:26:51,498] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +43: [2023-04-29 11:26:51,499] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 348 +18: [2023-04-29 11:26:51,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +31: [2023-04-29 11:26:51,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +17: [2023-04-29 11:26:51,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +52: [2023-04-29 11:26:51,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +11: [2023-04-29 11:26:51,499] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 92 +22: [2023-04-29 11:26:51,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +13: [2023-04-29 11:26:51,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 11:26:51,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 11:26:51,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 11:26:51,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +18: [2023-04-29 11:26:51,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +18: [2023-04-29 11:26:51,500] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +50: [2023-04-29 11:26:51,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +18: [2023-04-29 11:26:51,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +19: [2023-04-29 11:26:51,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +14: [2023-04-29 11:26:51,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +15: [2023-04-29 11:26:51,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +19: [2023-04-29 11:26:51,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +60: [2023-04-29 11:26:51,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +46: [2023-04-29 11:26:51,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_58_mp_rank_02_optim_states.pt... +46: [2023-04-29 11:26:51,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_57_mp_rank_02_optim_states.pt... +27: [2023-04-29 11:26:51,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +46: [2023-04-29 11:26:51,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_56_mp_rank_02_optim_states.pt... +27: [2023-04-29 11:26:51,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +46: [2023-04-29 11:26:51,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_59_mp_rank_02_optim_states.pt... +29: [2023-04-29 11:26:51,501] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +28: [2023-04-29 11:26:51,501] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +14: [2023-04-29 11:26:51,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +47: [2023-04-29 11:26:51,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +27: [2023-04-29 11:26:51,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +27: [2023-04-29 11:26:51,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +44: [2023-04-29 11:26:51,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +44: [2023-04-29 11:26:51,502] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +50: [2023-04-29 11:26:51,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +39: [2023-04-29 11:26:51,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_28_mp_rank_02_optim_states.pt. +39: [2023-04-29 11:26:51,503] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 312 +44: [2023-04-29 11:26:51,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +24: [2023-04-29 11:26:51,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +45: [2023-04-29 11:26:51,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +19: [2023-04-29 11:26:51,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +50: [2023-04-29 11:26:51,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +29: [2023-04-29 11:26:51,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +34: [2023-04-29 11:26:51,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +50: [2023-04-29 11:26:51,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +41: [2023-04-29 11:26:51,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 11:26:51,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 11:26:51,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +14: [2023-04-29 11:26:51,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +60: [2023-04-29 11:26:51,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +47: [2023-04-29 11:26:51,506] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +47: [2023-04-29 11:26:51,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +60: [2023-04-29 11:26:51,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +13: [2023-04-29 11:26:51,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +47: [2023-04-29 11:26:51,507] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +13: [2023-04-29 11:26:51,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +47: [2023-04-29 11:26:51,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +47: [2023-04-29 11:26:51,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +13: [2023-04-29 11:26:51,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +47: [2023-04-29 11:26:51,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +13: [2023-04-29 11:26:51,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +50: [2023-04-29 11:26:51,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +53: [2023-04-29 11:26:51,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +53: [2023-04-29 11:26:51,508] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +50: [2023-04-29 11:26:51,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +29: [2023-04-29 11:26:51,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +36: [2023-04-29 11:26:51,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +36: [2023-04-29 11:26:51,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +19: [2023-04-29 11:26:51,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +36: [2023-04-29 11:26:51,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +44: [2023-04-29 11:26:51,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +58: [2023-04-29 11:26:51,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +47: [2023-04-29 11:26:51,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +39: [2023-04-29 11:26:51,510] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 312 +24: [2023-04-29 11:26:51,510] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +47: [2023-04-29 11:26:51,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +47: [2023-04-29 11:26:51,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +50: [2023-04-29 11:26:51,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +47: [2023-04-29 11:26:51,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +32: [2023-04-29 11:26:51,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 11:26:51,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 11:26:51,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 11:26:51,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +60: [2023-04-29 11:26:51,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +24: [2023-04-29 11:26:51,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +24: [2023-04-29 11:26:51,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +60: [2023-04-29 11:26:51,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 11:26:51,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +45: [2023-04-29 11:26:51,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +28: [2023-04-29 11:26:51,511] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +47: [2023-04-29 11:26:51,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +29: [2023-04-29 11:26:51,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +36: [2023-04-29 11:26:51,512] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +14: [2023-04-29 11:26:51,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +29: [2023-04-29 11:26:51,513] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +47: [2023-04-29 11:26:51,513] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +47: [2023-04-29 11:26:51,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +47: [2023-04-29 11:26:51,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +57: [2023-04-29 11:26:51,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +47: [2023-04-29 11:26:51,514] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +52: [2023-04-29 11:26:51,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +52: [2023-04-29 11:26:51,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +58: [2023-04-29 11:26:51,514] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +57: [2023-04-29 11:26:51,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +57: [2023-04-29 11:26:51,515] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +50: [2023-04-29 11:26:51,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +50: [2023-04-29 11:26:51,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +50: [2023-04-29 11:26:51,516] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +32: [2023-04-29 11:26:51,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +58: [2023-04-29 11:26:51,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +28: [2023-04-29 11:26:51,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +57: [2023-04-29 11:26:51,517] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +47: [2023-04-29 11:26:51,517] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +60: [2023-04-29 11:26:51,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +20: [2023-04-29 11:26:51,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 8: [2023-04-29 11:26:51,518] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +28: [2023-04-29 11:26:51,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +32: [2023-04-29 11:26:51,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +20: [2023-04-29 11:26:51,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +26: [2023-04-29 11:26:51,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +26: [2023-04-29 11:26:51,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +26: [2023-04-29 11:26:51,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +29: [2023-04-29 11:26:51,520] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +26: [2023-04-29 11:26:51,521] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +52: [2023-04-29 11:26:51,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +45: [2023-04-29 11:26:51,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +29: [2023-04-29 11:26:51,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +50: [2023-04-29 11:26:51,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +50: [2023-04-29 11:26:51,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +58: [2023-04-29 11:26:51,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +45: [2023-04-29 11:26:51,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +52: [2023-04-29 11:26:51,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +25: [2023-04-29 11:26:51,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt... +47: [2023-04-29 11:26:51,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +25: [2023-04-29 11:26:51,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt... +25: [2023-04-29 11:26:51,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt... +25: [2023-04-29 11:26:51,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt... +28: [2023-04-29 11:26:51,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +28: [2023-04-29 11:26:51,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +20: [2023-04-29 11:26:51,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +20: [2023-04-29 11:26:51,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +52: [2023-04-29 11:26:51,524] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 11:26:51,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +53: [2023-04-29 11:26:51,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +53: [2023-04-29 11:26:51,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 11:26:51,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 11:26:51,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +13: [2023-04-29 11:26:51,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +22: [2023-04-29 11:26:51,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +59: [2023-04-29 11:26:51,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +59: [2023-04-29 11:26:51,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +59: [2023-04-29 11:26:51,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +22: [2023-04-29 11:26:51,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +28: [2023-04-29 11:26:51,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +47: [2023-04-29 11:26:51,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 2: [2023-04-29 11:26:51,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 2: [2023-04-29 11:26:51,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +59: [2023-04-29 11:26:51,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. + 2: [2023-04-29 11:26:51,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 2: [2023-04-29 11:26:51,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +58: [2023-04-29 11:26:51,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 11:26:51,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +13: [2023-04-29 11:26:51,528] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +40: [2023-04-29 11:26:51,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +20: [2023-04-29 11:26:51,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +13: [2023-04-29 11:26:51,529] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +49: [2023-04-29 11:26:51,529] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 11:26:51,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +41: [2023-04-29 11:26:51,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 11:26:51,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +57: [2023-04-29 11:26:51,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_103_mp_rank_02_optim_states.pt... +57: [2023-04-29 11:26:51,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_100_mp_rank_02_optim_states.pt... +57: [2023-04-29 11:26:51,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_101_mp_rank_02_optim_states.pt... +57: [2023-04-29 11:26:51,530] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_102_mp_rank_02_optim_states.pt... +28: [2023-04-29 11:26:51,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +22: [2023-04-29 11:26:51,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +41: [2023-04-29 11:26:51,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +52: [2023-04-29 11:26:51,531] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +13: [2023-04-29 11:26:51,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +52: [2023-04-29 11:26:51,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +63: [2023-04-29 11:26:51,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_126_mp_rank_02_optim_states.pt. +52: [2023-04-29 11:26:51,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +52: [2023-04-29 11:26:51,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +63: [2023-04-29 11:26:51,532] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 508 +32: [2023-04-29 11:26:51,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +42: [2023-04-29 11:26:51,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 11:26:51,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +35: [2023-04-29 11:26:51,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +35: [2023-04-29 11:26:51,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +35: [2023-04-29 11:26:51,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +35: [2023-04-29 11:26:51,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_42-model_01-model_states.pt. +52: [2023-04-29 11:26:51,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +52: [2023-04-29 11:26:51,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +61: [2023-04-29 11:26:51,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 11:26:51,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +41: [2023-04-29 11:26:51,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 11:26:51,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +41: [2023-04-29 11:26:51,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +47: [2023-04-29 11:26:51,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +41: [2023-04-29 11:26:51,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 11:26:51,533] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 11:26:51,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +52: [2023-04-29 11:26:51,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +52: [2023-04-29 11:26:51,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 11:26:51,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 11:26:51,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +52: [2023-04-29 11:26:51,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +41: [2023-04-29 11:26:51,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +41: [2023-04-29 11:26:51,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +28: [2023-04-29 11:26:51,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +41: [2023-04-29 11:26:51,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +49: [2023-04-29 11:26:51,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +52: [2023-04-29 11:26:51,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 11:26:51,534] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +49: [2023-04-29 11:26:51,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +49: [2023-04-29 11:26:51,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 11:26:51,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +52: [2023-04-29 11:26:51,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +22: [2023-04-29 11:26:51,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +40: [2023-04-29 11:26:51,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +53: [2023-04-29 11:26:51,535] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +52: [2023-04-29 11:26:51,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +20: [2023-04-29 11:26:51,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +21: [2023-04-29 11:26:51,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 4: [2023-04-29 11:26:51,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +20: [2023-04-29 11:26:51,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +53: [2023-04-29 11:26:51,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +40: [2023-04-29 11:26:51,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +40: [2023-04-29 11:26:51,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +40: [2023-04-29 11:26:51,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +28: [2023-04-29 11:26:51,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +61: [2023-04-29 11:26:51,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +61: [2023-04-29 11:26:51,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +28: [2023-04-29 11:26:51,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 4: [2023-04-29 11:26:51,538] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +50: [2023-04-29 11:26:51,538] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +50: [2023-04-29 11:26:51,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +61: [2023-04-29 11:26:51,539] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +42: [2023-04-29 11:26:51,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 11:26:51,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +49: [2023-04-29 11:26:51,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +49: [2023-04-29 11:26:51,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +49: [2023-04-29 11:26:51,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +53: [2023-04-29 11:26:51,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +53: [2023-04-29 11:26:51,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +53: [2023-04-29 11:26:51,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +53: [2023-04-29 11:26:51,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +19: [2023-04-29 11:26:51,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt. +19: [2023-04-29 11:26:51,541] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 158 +53: [2023-04-29 11:26:51,541] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +21: [2023-04-29 11:26:51,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... + 4: [2023-04-29 11:26:51,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +53: [2023-04-29 11:26:51,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +39: [2023-04-29 11:26:51,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_30_mp_rank_02_optim_states.pt. +39: [2023-04-29 11:26:51,542] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 316 +50: [2023-04-29 11:26:51,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +32: [2023-04-29 11:26:51,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +53: [2023-04-29 11:26:51,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 4: [2023-04-29 11:26:51,543] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt. +40: [2023-04-29 11:26:51,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +20: [2023-04-29 11:26:51,543] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... + 4: [2023-04-29 11:26:51,544] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 32 + 4: [2023-04-29 11:26:51,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +40: [2023-04-29 11:26:51,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +40: [2023-04-29 11:26:51,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +50: [2023-04-29 11:26:51,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +50: [2023-04-29 11:26:51,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +50: [2023-04-29 11:26:51,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +50: [2023-04-29 11:26:51,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +50: [2023-04-29 11:26:51,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +50: [2023-04-29 11:26:51,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +26: [2023-04-29 11:26:51,545] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +49: [2023-04-29 11:26:51,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +50: [2023-04-29 11:26:51,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +50: [2023-04-29 11:26:51,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +50: [2023-04-29 11:26:51,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 4: [2023-04-29 11:26:51,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +47: [2023-04-29 11:26:51,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_63_mp_rank_02_optim_states.pt... +47: [2023-04-29 11:26:51,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_60_mp_rank_02_optim_states.pt... +47: [2023-04-29 11:26:51,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_61_mp_rank_02_optim_states.pt... +47: [2023-04-29 11:26:51,546] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_62_mp_rank_02_optim_states.pt... +42: [2023-04-29 11:26:51,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 11:26:51,547] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +50: [2023-04-29 11:26:51,548] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +19: [2023-04-29 11:26:51,549] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 158 +50: [2023-04-29 11:26:51,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +50: [2023-04-29 11:26:51,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +50: [2023-04-29 11:26:51,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +53: [2023-04-29 11:26:51,549] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +39: [2023-04-29 11:26:51,549] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 316 +42: [2023-04-29 11:26:51,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +59: [2023-04-29 11:26:51,551] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 4: [2023-04-29 11:26:51,551] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 32 + 4: [2023-04-29 11:26:51,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +44: [2023-04-29 11:26:51,551] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +35: [2023-04-29 11:26:51,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 11:26:51,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +35: [2023-04-29 11:26:51,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +32: [2023-04-29 11:26:51,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +46: [2023-04-29 11:26:51,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +46: [2023-04-29 11:26:51,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +46: [2023-04-29 11:26:51,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +32: [2023-04-29 11:26:51,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +32: [2023-04-29 11:26:51,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 4: [2023-04-29 11:26:51,552] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... + 5: [2023-04-29 11:26:51,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +23: [2023-04-29 11:26:51,552] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt. +23: [2023-04-29 11:26:51,553] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 188 +46: [2023-04-29 11:26:51,553] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +26: [2023-04-29 11:26:51,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +32: [2023-04-29 11:26:51,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +16: [2023-04-29 11:26:51,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +16: [2023-04-29 11:26:51,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +16: [2023-04-29 11:26:51,555] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +32: [2023-04-29 11:26:51,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +32: [2023-04-29 11:26:51,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +32: [2023-04-29 11:26:51,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +32: [2023-04-29 11:26:51,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +32: [2023-04-29 11:26:51,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +32: [2023-04-29 11:26:51,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +32: [2023-04-29 11:26:51,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +32: [2023-04-29 11:26:51,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +32: [2023-04-29 11:26:51,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +32: [2023-04-29 11:26:51,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +32: [2023-04-29 11:26:51,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +26: [2023-04-29 11:26:51,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +32: [2023-04-29 11:26:51,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +44: [2023-04-29 11:26:51,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 4: [2023-04-29 11:26:51,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +21: [2023-04-29 11:26:51,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +35: [2023-04-29 11:26:51,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +35: [2023-04-29 11:26:51,558] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +53: [2023-04-29 11:26:51,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +53: [2023-04-29 11:26:51,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +16: [2023-04-29 11:26:51,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +53: [2023-04-29 11:26:51,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +53: [2023-04-29 11:26:51,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +53: [2023-04-29 11:26:51,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +53: [2023-04-29 11:26:51,557] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +53: [2023-04-29 11:26:51,557] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +59: [2023-04-29 11:26:51,554] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +59: [2023-04-29 11:26:51,556] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +53: [2023-04-29 11:26:51,559] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +59: [2023-04-29 11:26:51,558] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +35: [2023-04-29 11:26:51,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +26: [2023-04-29 11:26:51,559] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +21: [2023-04-29 11:26:51,560] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +23: [2023-04-29 11:26:51,560] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 188 + 2: [2023-04-29 11:26:51,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +61: [2023-04-29 11:26:51,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +42: [2023-04-29 11:26:51,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +42: [2023-04-29 11:26:51,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 2: [2023-04-29 11:26:51,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +35: [2023-04-29 11:26:51,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 2: [2023-04-29 11:26:51,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... + 2: [2023-04-29 11:26:51,561] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +27: [2023-04-29 11:26:51,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +53: [2023-04-29 11:26:51,561] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +35: [2023-04-29 11:26:51,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +42: [2023-04-29 11:26:51,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +35: [2023-04-29 11:26:51,563] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +18: [2023-04-29 11:26:51,563] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +21: [2023-04-29 11:26:51,564] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +21: [2023-04-29 11:26:51,565] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +27: [2023-04-29 11:26:51,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +53: [2023-04-29 11:26:51,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +21: [2023-04-29 11:26:51,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +35: [2023-04-29 11:26:51,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +61: [2023-04-29 11:26:51,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +61: [2023-04-29 11:26:51,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 1: [2023-04-29 11:26:51,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt... + 1: [2023-04-29 11:26:51,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt... + 1: [2023-04-29 11:26:51,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt... + 1: [2023-04-29 11:26:51,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt... +35: [2023-04-29 11:26:51,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +30: [2023-04-29 11:26:51,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +30: [2023-04-29 11:26:51,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +30: [2023-04-29 11:26:51,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +42: [2023-04-29 11:26:51,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +42: [2023-04-29 11:26:51,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +61: [2023-04-29 11:26:51,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +61: [2023-04-29 11:26:51,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +61: [2023-04-29 11:26:51,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +61: [2023-04-29 11:26:51,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +61: [2023-04-29 11:26:51,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +61: [2023-04-29 11:26:51,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +61: [2023-04-29 11:26:51,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +61: [2023-04-29 11:26:51,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +35: [2023-04-29 11:26:51,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +35: [2023-04-29 11:26:51,567] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt... +61: [2023-04-29 11:26:51,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +44: [2023-04-29 11:26:51,568] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +30: [2023-04-29 11:26:51,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +61: [2023-04-29 11:26:51,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +61: [2023-04-29 11:26:51,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +63: [2023-04-29 11:26:51,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_125_mp_rank_02_optim_states.pt. +61: [2023-04-29 11:26:51,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +63: [2023-04-29 11:26:51,568] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 506 +61: [2023-04-29 11:26:51,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +27: [2023-04-29 11:26:51,568] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +53: [2023-04-29 11:26:51,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +42: [2023-04-29 11:26:51,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +24: [2023-04-29 11:26:51,569] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +42: [2023-04-29 11:26:51,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,570] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +42: [2023-04-29 11:26:51,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +27: [2023-04-29 11:26:51,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +18: [2023-04-29 11:26:51,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +18: [2023-04-29 11:26:51,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +42: [2023-04-29 11:26:51,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +39: [2023-04-29 11:26:51,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_31_mp_rank_02_optim_states.pt. +42: [2023-04-29 11:26:51,571] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +42: [2023-04-29 11:26:51,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +39: [2023-04-29 11:26:51,571] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 318 +11: [2023-04-29 11:26:51,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +11: [2023-04-29 11:26:51,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +42: [2023-04-29 11:26:51,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +11: [2023-04-29 11:26:51,571] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +11: [2023-04-29 11:26:51,572] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +30: [2023-04-29 11:26:51,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 11:26:51,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +44: [2023-04-29 11:26:51,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +30: [2023-04-29 11:26:51,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +30: [2023-04-29 11:26:51,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +30: [2023-04-29 11:26:51,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +18: [2023-04-29 11:26:51,574] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... + 5: [2023-04-29 11:26:51,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +24: [2023-04-29 11:26:51,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +27: [2023-04-29 11:26:51,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +53: [2023-04-29 11:26:51,574] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +36: [2023-04-29 11:26:51,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 11:26:51,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +44: [2023-04-29 11:26:51,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +44: [2023-04-29 11:26:51,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +44: [2023-04-29 11:26:51,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +27: [2023-04-29 11:26:51,576] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +43: [2023-04-29 11:26:51,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_44_mp_rank_02_optim_states.pt. +27: [2023-04-29 11:26:51,576] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +44: [2023-04-29 11:26:51,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +44: [2023-04-29 11:26:51,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +43: [2023-04-29 11:26:51,577] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 344 +24: [2023-04-29 11:26:51,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,577] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +57: [2023-04-29 11:26:51,577] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +39: [2023-04-29 11:26:51,578] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 318 +36: [2023-04-29 11:26:51,578] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +42: [2023-04-29 11:26:51,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +52: [2023-04-29 11:26:51,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_83_mp_rank_02_optim_states.pt... +52: [2023-04-29 11:26:51,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_82_mp_rank_02_optim_states.pt... +52: [2023-04-29 11:26:51,579] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_81_mp_rank_02_optim_states.pt... +42: [2023-04-29 11:26:51,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +52: [2023-04-29 11:26:51,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_80_mp_rank_02_optim_states.pt... +42: [2023-04-29 11:26:51,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +42: [2023-04-29 11:26:51,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +53: [2023-04-29 11:26:51,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +44: [2023-04-29 11:26:51,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +42: [2023-04-29 11:26:51,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +36: [2023-04-29 11:26:51,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +42: [2023-04-29 11:26:51,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +42: [2023-04-29 11:26:51,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +42: [2023-04-29 11:26:51,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +44: [2023-04-29 11:26:51,580] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +44: [2023-04-29 11:26:51,580] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +42: [2023-04-29 11:26:51,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +44: [2023-04-29 11:26:51,581] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +41: [2023-04-29 11:26:51,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_36_mp_rank_02_optim_states.pt... +41: [2023-04-29 11:26:51,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_39_mp_rank_02_optim_states.pt... +41: [2023-04-29 11:26:51,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_37_mp_rank_02_optim_states.pt... +41: [2023-04-29 11:26:51,581] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_38_mp_rank_02_optim_states.pt... +27: [2023-04-29 11:26:51,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +43: [2023-04-29 11:26:51,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_47_mp_rank_02_optim_states.pt. + 7: [2023-04-29 11:26:51,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +43: [2023-04-29 11:26:51,582] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 350 +36: [2023-04-29 11:26:51,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 7: [2023-04-29 11:26:51,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. + 7: [2023-04-29 11:26:51,582] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +36: [2023-04-29 11:26:51,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +57: [2023-04-29 11:26:51,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +24: [2023-04-29 11:26:51,582] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +62: [2023-04-29 11:26:51,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_120_mp_rank_02_optim_states.pt. +52: [2023-04-29 11:26:51,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +62: [2023-04-29 11:26:51,583] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 496 +24: [2023-04-29 11:26:51,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 7: [2023-04-29 11:26:51,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_20-model_01-model_states.pt. +46: [2023-04-29 11:26:51,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +57: [2023-04-29 11:26:51,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +53: [2023-04-29 11:26:51,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_85_mp_rank_02_optim_states.pt... +53: [2023-04-29 11:26:51,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_87_mp_rank_02_optim_states.pt... +46: [2023-04-29 11:26:51,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +46: [2023-04-29 11:26:51,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +53: [2023-04-29 11:26:51,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_86_mp_rank_02_optim_states.pt... +53: [2023-04-29 11:26:51,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_84_mp_rank_02_optim_states.pt... +43: [2023-04-29 11:26:51,585] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 344 +16: [2023-04-29 11:26:51,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +36: [2023-04-29 11:26:51,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +44: [2023-04-29 11:26:51,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +36: [2023-04-29 11:26:51,585] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +44: [2023-04-29 11:26:51,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +44: [2023-04-29 11:26:51,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +53: [2023-04-29 11:26:51,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +44: [2023-04-29 11:26:51,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 4: [2023-04-29 11:26:51,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt. +42: [2023-04-29 11:26:51,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 4: [2023-04-29 11:26:51,587] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 38 +24: [2023-04-29 11:26:51,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +36: [2023-04-29 11:26:51,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +52: [2023-04-29 11:26:51,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +46: [2023-04-29 11:26:51,588] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +52: [2023-04-29 11:26:51,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +43: [2023-04-29 11:26:51,589] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 350 +57: [2023-04-29 11:26:51,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +57: [2023-04-29 11:26:51,589] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +16: [2023-04-29 11:26:51,589] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +57: [2023-04-29 11:26:51,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +13: [2023-04-29 11:26:51,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 11:26:51,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 11:26:51,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +61: [2023-04-29 11:26:51,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_116_mp_rank_02_optim_states.pt... +61: [2023-04-29 11:26:51,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_119_mp_rank_02_optim_states.pt... +57: [2023-04-29 11:26:51,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +59: [2023-04-29 11:26:51,604] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +13: [2023-04-29 11:26:51,598] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +10: [2023-04-29 11:26:51,597] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 84 +18: [2023-04-29 11:26:51,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +18: [2023-04-29 11:26:51,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +22: [2023-04-29 11:26:51,597] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +24: [2023-04-29 11:26:51,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +46: [2023-04-29 11:26:51,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +42: [2023-04-29 11:26:51,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +28: [2023-04-29 11:26:51,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt... +28: [2023-04-29 11:26:51,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt... +28: [2023-04-29 11:26:51,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt... + 2: [2023-04-29 11:26:51,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 2: [2023-04-29 11:26:51,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 2: [2023-04-29 11:26:51,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 2: [2023-04-29 11:26:51,632] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +33: [2023-04-29 11:26:51,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_4_mp_rank_02_optim_states.pt. +44: [2023-04-29 11:26:51,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_49_mp_rank_02_optim_states.pt... + 4: [2023-04-29 11:26:51,593] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 38 +30: [2023-04-29 11:26:51,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +30: [2023-04-29 11:26:51,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +35: [2023-04-29 11:26:51,625] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 11:26:51,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... + 7: [2023-04-29 11:26:51,604] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 11:26:51,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +50: [2023-04-29 11:26:51,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_72_mp_rank_02_optim_states.pt... + 6: [2023-04-29 11:26:51,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +32: [2023-04-29 11:26:51,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt... +32: [2023-04-29 11:26:51,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt... +16: [2023-04-29 11:26:51,590] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +26: [2023-04-29 11:26:51,616] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +23: [2023-04-29 11:26:51,621] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt. +61: [2023-04-29 11:26:51,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_117_mp_rank_02_optim_states.pt... +57: [2023-04-29 11:26:51,595] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +59: [2023-04-29 11:26:51,608] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +13: [2023-04-29 11:26:51,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 11:26:51,603] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 80 +18: [2023-04-29 11:26:51,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +22: [2023-04-29 11:26:51,600] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +24: [2023-04-29 11:26:51,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +42: [2023-04-29 11:26:51,592] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +28: [2023-04-29 11:26:51,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt... + 2: [2023-04-29 11:26:51,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... + 2: [2023-04-29 11:26:51,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +33: [2023-04-29 11:26:51,614] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 264 +44: [2023-04-29 11:26:51,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_48_mp_rank_02_optim_states.pt... +44: [2023-04-29 11:26:51,630] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_51_mp_rank_02_optim_states.pt... + 4: [2023-04-29 11:26:51,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt. +35: [2023-04-29 11:26:51,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 11:26:51,594] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 7: [2023-04-29 11:26:51,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 11:26:51,609] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +50: [2023-04-29 11:26:51,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_74_mp_rank_02_optim_states.pt... +50: [2023-04-29 11:26:51,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_73_mp_rank_02_optim_states.pt... + 6: [2023-04-29 11:26:51,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +16: [2023-04-29 11:26:51,593] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +61: [2023-04-29 11:26:51,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_118_mp_rank_02_optim_states.pt... +59: [2023-04-29 11:26:51,623] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +13: [2023-04-29 11:26:51,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 11:26:51,604] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 82 +18: [2023-04-29 11:26:51,615] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +22: [2023-04-29 11:26:51,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +42: [2023-04-29 11:26:51,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_41_mp_rank_02_optim_states.pt... + 2: [2023-04-29 11:26:51,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +33: [2023-04-29 11:26:51,621] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 264 +44: [2023-04-29 11:26:51,631] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_50_mp_rank_02_optim_states.pt... + 4: [2023-04-29 11:26:51,629] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 36 +30: [2023-04-29 11:26:51,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +35: [2023-04-29 11:26:51,639] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +52: [2023-04-29 11:26:51,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 7: [2023-04-29 11:26:51,614] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 11:26:51,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +50: [2023-04-29 11:26:51,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_75_mp_rank_02_optim_states.pt... + 6: [2023-04-29 11:26:51,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +16: [2023-04-29 11:26:51,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt. +23: [2023-04-29 11:26:51,621] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 184 +59: [2023-04-29 11:26:51,628] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +13: [2023-04-29 11:26:51,602] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +10: [2023-04-29 11:26:51,613] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 86 +18: [2023-04-29 11:26:51,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +22: [2023-04-29 11:26:51,605] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +42: [2023-04-29 11:26:51,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_43_mp_rank_02_optim_states.pt... + 2: [2023-04-29 11:26:51,640] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +33: [2023-04-29 11:26:51,629] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_7_mp_rank_02_optim_states.pt. +30: [2023-04-29 11:26:51,611] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +35: [2023-04-29 11:26:51,641] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 11:26:51,599] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... + 7: [2023-04-29 11:26:51,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt... +11: [2023-04-29 11:26:51,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 6: [2023-04-29 11:26:51,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +16: [2023-04-29 11:26:51,620] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 128 +23: [2023-04-29 11:26:51,628] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 184 +59: [2023-04-29 11:26:51,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +13: [2023-04-29 11:26:51,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +18: [2023-04-29 11:26:51,646] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +22: [2023-04-29 11:26:51,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +42: [2023-04-29 11:26:51,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_42_mp_rank_02_optim_states.pt... +42: [2023-04-29 11:26:51,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_40_mp_rank_02_optim_states.pt... +33: [2023-04-29 11:26:51,630] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 270 + 4: [2023-04-29 11:26:51,638] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 36 +30: [2023-04-29 11:26:51,641] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +52: [2023-04-29 11:26:51,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... + 7: [2023-04-29 11:26:51,620] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt. + 6: [2023-04-29 11:26:51,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +16: [2023-04-29 11:26:51,629] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 128 +59: [2023-04-29 11:26:51,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +13: [2023-04-29 11:26:51,610] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +18: [2023-04-29 11:26:51,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +18: [2023-04-29 11:26:51,648] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +22: [2023-04-29 11:26:51,610] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +33: [2023-04-29 11:26:51,631] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_5_mp_rank_02_optim_states.pt. + 4: [2023-04-29 11:26:51,638] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt. +30: [2023-04-29 11:26:51,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +35: [2023-04-29 11:26:51,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... + 7: [2023-04-29 11:26:51,620] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 60 + 6: [2023-04-29 11:26:51,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +16: [2023-04-29 11:26:51,644] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +59: [2023-04-29 11:26:51,635] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +13: [2023-04-29 11:26:51,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +18: [2023-04-29 11:26:51,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt... +18: [2023-04-29 11:26:51,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt... +18: [2023-04-29 11:26:51,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt... +18: [2023-04-29 11:26:51,649] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt... +22: [2023-04-29 11:26:51,616] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +33: [2023-04-29 11:26:51,631] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 266 + 4: [2023-04-29 11:26:51,638] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 34 +30: [2023-04-29 11:26:51,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +35: [2023-04-29 11:26:51,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 7: [2023-04-29 11:26:51,627] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 60 + 6: [2023-04-29 11:26:51,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +59: [2023-04-29 11:26:51,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +13: [2023-04-29 11:26:51,628] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +22: [2023-04-29 11:26:51,618] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +33: [2023-04-29 11:26:51,638] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 270 + 4: [2023-04-29 11:26:51,645] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 34 +30: [2023-04-29 11:26:51,644] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +35: [2023-04-29 11:26:51,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,645] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +13: [2023-04-29 11:26:51,636] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +33: [2023-04-29 11:26:51,640] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 266 +30: [2023-04-29 11:26:51,648] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +32: [2023-04-29 11:26:51,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_0_mp_rank_02_optim_states.pt... +32: [2023-04-29 11:26:51,615] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_3_mp_rank_02_optim_states.pt... +26: [2023-04-29 11:26:51,623] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +26: [2023-04-29 11:26:51,627] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +26: [2023-04-29 11:26:51,634] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +26: [2023-04-29 11:26:51,635] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +26: [2023-04-29 11:26:51,640] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +26: [2023-04-29 11:26:51,643] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +26: [2023-04-29 11:26:51,647] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +35: [2023-04-29 11:26:51,651] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +16: [2023-04-29 11:26:51,651] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +46: [2023-04-29 11:26:51,652] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +29: [2023-04-29 11:26:51,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +29: [2023-04-29 11:26:51,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +29: [2023-04-29 11:26:51,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +46: [2023-04-29 11:26:51,654] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +11: [2023-04-29 11:26:51,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +43: [2023-04-29 11:26:51,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +43: [2023-04-29 11:26:51,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +43: [2023-04-29 11:26:51,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +33: [2023-04-29 11:26:51,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +43: [2023-04-29 11:26:51,654] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +33: [2023-04-29 11:26:51,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +33: [2023-04-29 11:26:51,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +29: [2023-04-29 11:26:51,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +35: [2023-04-29 11:26:51,655] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +33: [2023-04-29 11:26:51,655] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +46: [2023-04-29 11:26:51,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +35: [2023-04-29 11:26:51,656] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_00-model_states.pt. +46: [2023-04-29 11:26:51,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +11: [2023-04-29 11:26:51,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +35: [2023-04-29 11:26:51,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +29: [2023-04-29 11:26:51,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +29: [2023-04-29 11:26:51,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +35: [2023-04-29 11:26:51,660] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +16: [2023-04-29 11:26:51,660] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt. +16: [2023-04-29 11:26:51,660] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 130 +29: [2023-04-29 11:26:51,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +29: [2023-04-29 11:26:51,661] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +46: [2023-04-29 11:26:51,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +51: [2023-04-29 11:26:51,662] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_79_mp_rank_02_optim_states.pt. +51: [2023-04-29 11:26:51,663] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 414 +35: [2023-04-29 11:26:51,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +35: [2023-04-29 11:26:51,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +46: [2023-04-29 11:26:51,663] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +35: [2023-04-29 11:26:51,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt... +35: [2023-04-29 11:26:51,664] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 7: [2023-04-29 11:26:51,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +35: [2023-04-29 11:26:51,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +35: [2023-04-29 11:26:51,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +35: [2023-04-29 11:26:51,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +35: [2023-04-29 11:26:51,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +46: [2023-04-29 11:26:51,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +35: [2023-04-29 11:26:51,669] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 7: [2023-04-29 11:26:51,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +16: [2023-04-29 11:26:51,667] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 130 +35: [2023-04-29 11:26:51,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +35: [2023-04-29 11:26:51,670] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +51: [2023-04-29 11:26:51,670] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 414 +35: [2023-04-29 11:26:51,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +16: [2023-04-29 11:26:51,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +16: [2023-04-29 11:26:51,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +16: [2023-04-29 11:26:51,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. + 7: [2023-04-29 11:26:51,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +39: [2023-04-29 11:26:51,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +39: [2023-04-29 11:26:51,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +39: [2023-04-29 11:26:51,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +39: [2023-04-29 11:26:51,672] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. + 7: [2023-04-29 11:26:51,676] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +19: [2023-04-29 11:26:51,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt. +19: [2023-04-29 11:26:51,677] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 156 +23: [2023-04-29 11:26:51,677] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt. +23: [2023-04-29 11:26:51,677] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 190 +16: [2023-04-29 11:26:51,678] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt. +16: [2023-04-29 11:26:51,678] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 132 +24: [2023-04-29 11:26:51,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +24: [2023-04-29 11:26:51,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +24: [2023-04-29 11:26:51,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +24: [2023-04-29 11:26:51,679] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 7: [2023-04-29 11:26:51,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +16: [2023-04-29 11:26:51,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +43: [2023-04-29 11:26:51,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +16: [2023-04-29 11:26:51,680] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt. +33: [2023-04-29 11:26:51,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +16: [2023-04-29 11:26:51,680] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +16: [2023-04-29 11:26:51,681] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 134 +43: [2023-04-29 11:26:51,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +62: [2023-04-29 11:26:51,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_122_mp_rank_02_optim_states.pt. +16: [2023-04-29 11:26:51,681] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +33: [2023-04-29 11:26:51,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +62: [2023-04-29 11:26:51,681] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 500 +11: [2023-04-29 11:26:51,681] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +43: [2023-04-29 11:26:51,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +35: [2023-04-29 11:26:51,682] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +35: [2023-04-29 11:26:51,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +35: [2023-04-29 11:26:51,683] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +35: [2023-04-29 11:26:51,683] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +43: [2023-04-29 11:26:51,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +43: [2023-04-29 11:26:51,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +22: [2023-04-29 11:26:51,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +22: [2023-04-29 11:26:51,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +22: [2023-04-29 11:26:51,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +22: [2023-04-29 11:26:51,653] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +22: [2023-04-29 11:26:51,659] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +22: [2023-04-29 11:26:51,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +22: [2023-04-29 11:26:51,662] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +22: [2023-04-29 11:26:51,663] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +43: [2023-04-29 11:26:51,684] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +43: [2023-04-29 11:26:51,684] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +43: [2023-04-29 11:26:51,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +43: [2023-04-29 11:26:51,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +11: [2023-04-29 11:26:51,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +11: [2023-04-29 11:26:51,685] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +24: [2023-04-29 11:26:51,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +23: [2023-04-29 11:26:51,685] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 190 +43: [2023-04-29 11:26:51,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 7: [2023-04-29 11:26:51,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... +24: [2023-04-29 11:26:51,685] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +43: [2023-04-29 11:26:51,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +43: [2023-04-29 11:26:51,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +33: [2023-04-29 11:26:51,686] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +56: [2023-04-29 11:26:51,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_98_mp_rank_02_optim_states.pt. +56: [2023-04-29 11:26:51,686] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 452 +33: [2023-04-29 11:26:51,686] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +19: [2023-04-29 11:26:51,687] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 156 +33: [2023-04-29 11:26:51,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +24: [2023-04-29 11:26:51,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +33: [2023-04-29 11:26:51,687] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +24: [2023-04-29 11:26:51,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +33: [2023-04-29 11:26:51,687] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +16: [2023-04-29 11:26:51,687] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 132 +33: [2023-04-29 11:26:51,688] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +13: [2023-04-29 11:26:51,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt... +13: [2023-04-29 11:26:51,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt... +13: [2023-04-29 11:26:51,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt... +13: [2023-04-29 11:26:51,666] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt... +11: [2023-04-29 11:26:51,689] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... + 7: [2023-04-29 11:26:51,690] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_00-model_states.pt. +33: [2023-04-29 11:26:51,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +33: [2023-04-29 11:26:51,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +33: [2023-04-29 11:26:51,691] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +16: [2023-04-29 11:26:51,691] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 134 +33: [2023-04-29 11:26:51,692] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +30: [2023-04-29 11:26:51,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +30: [2023-04-29 11:26:51,665] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +30: [2023-04-29 11:26:51,666] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 7: [2023-04-29 11:26:51,692] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt. + 7: [2023-04-29 11:26:51,693] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 58 +11: [2023-04-29 11:26:51,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +11: [2023-04-29 11:26:51,694] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... + 7: [2023-04-29 11:26:51,696] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt... + 7: [2023-04-29 11:26:51,701] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 58 +33: [2023-04-29 11:26:51,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +33: [2023-04-29 11:26:51,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +33: [2023-04-29 11:26:51,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +33: [2023-04-29 11:26:51,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +39: [2023-04-29 11:26:51,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +39: [2023-04-29 11:26:51,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +39: [2023-04-29 11:26:51,704] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +43: [2023-04-29 11:26:51,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +43: [2023-04-29 11:26:51,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +43: [2023-04-29 11:26:51,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +43: [2023-04-29 11:26:51,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +62: [2023-04-29 11:26:51,704] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +39: [2023-04-29 11:26:51,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +39: [2023-04-29 11:26:51,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +39: [2023-04-29 11:26:51,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +25: [2023-04-29 11:26:51,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +25: [2023-04-29 11:26:51,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +62: [2023-04-29 11:26:51,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +25: [2023-04-29 11:26:51,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +62: [2023-04-29 11:26:51,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +25: [2023-04-29 11:26:51,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +62: [2023-04-29 11:26:51,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. + 8: [2023-04-29 11:26:51,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 8: [2023-04-29 11:26:51,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 8: [2023-04-29 11:26:51,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 8: [2023-04-29 11:26:51,706] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +39: [2023-04-29 11:26:51,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +39: [2023-04-29 11:26:51,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +39: [2023-04-29 11:26:51,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +39: [2023-04-29 11:26:51,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +39: [2023-04-29 11:26:51,707] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +39: [2023-04-29 11:26:51,707] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +51: [2023-04-29 11:26:51,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_78_mp_rank_02_optim_states.pt. +51: [2023-04-29 11:26:51,708] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 412 +35: [2023-04-29 11:26:51,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_14_mp_rank_02_optim_states.pt... +35: [2023-04-29 11:26:51,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt... +35: [2023-04-29 11:26:51,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_13_mp_rank_02_optim_states.pt... +35: [2023-04-29 11:26:51,709] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_15_mp_rank_02_optim_states.pt... + 6: [2023-04-29 11:26:51,709] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 11:26:51,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 11:26:51,710] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +39: [2023-04-29 11:26:51,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +39: [2023-04-29 11:26:51,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +39: [2023-04-29 11:26:51,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +39: [2023-04-29 11:26:51,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. + 9: [2023-04-29 11:26:51,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt. + 9: [2023-04-29 11:26:51,711] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 72 +39: [2023-04-29 11:26:51,711] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_29_mp_rank_02_optim_states.pt. +39: [2023-04-29 11:26:51,712] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 314 +12: [2023-04-29 11:26:51,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +12: [2023-04-29 11:26:51,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +12: [2023-04-29 11:26:51,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +12: [2023-04-29 11:26:51,713] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +14: [2023-04-29 11:26:51,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +14: [2023-04-29 11:26:51,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +14: [2023-04-29 11:26:51,714] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +51: [2023-04-29 11:26:51,714] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 412 +33: [2023-04-29 11:26:51,715] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_6_mp_rank_02_optim_states.pt. + 6: [2023-04-29 11:26:51,715] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +33: [2023-04-29 11:26:51,715] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 268 +62: [2023-04-29 11:26:51,716] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 496 +29: [2023-04-29 11:26:51,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,716] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt. + 6: [2023-04-29 11:26:51,717] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 52 +14: [2023-04-29 11:26:51,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,717] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 11:26:51,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +18: [2023-04-29 11:26:51,717] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... + 9: [2023-04-29 11:26:51,717] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 72 +62: [2023-04-29 11:26:51,719] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 500 +12: [2023-04-29 11:26:51,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +12: [2023-04-29 11:26:51,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +12: [2023-04-29 11:26:51,719] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +39: [2023-04-29 11:26:51,720] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 314 +14: [2023-04-29 11:26:51,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +18: [2023-04-29 11:26:51,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 11:26:51,720] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +12: [2023-04-29 11:26:51,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +14: [2023-04-29 11:26:51,720] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +33: [2023-04-29 11:26:51,721] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 268 +29: [2023-04-29 11:26:51,721] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +30: [2023-04-29 11:26:51,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +30: [2023-04-29 11:26:51,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +14: [2023-04-29 11:26:51,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +54: [2023-04-29 11:26:51,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +54: [2023-04-29 11:26:51,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +54: [2023-04-29 11:26:51,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. + 6: [2023-04-29 11:26:51,724] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +30: [2023-04-29 11:26:51,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +54: [2023-04-29 11:26:51,724] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. + 6: [2023-04-29 11:26:51,725] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 52 +14: [2023-04-29 11:26:51,725] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +18: [2023-04-29 11:26:51,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +26: [2023-04-29 11:26:51,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +26: [2023-04-29 11:26:51,727] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +18: [2023-04-29 11:26:51,727] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +29: [2023-04-29 11:26:51,728] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +22: [2023-04-29 11:26:51,723] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +20: [2023-04-29 11:26:51,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +20: [2023-04-29 11:26:51,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +30: [2023-04-29 11:26:51,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +30: [2023-04-29 11:26:51,729] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +29: [2023-04-29 11:26:51,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +26: [2023-04-29 11:26:51,729] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +30: [2023-04-29 11:26:51,730] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +26: [2023-04-29 11:26:51,730] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +20: [2023-04-29 11:26:51,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +20: [2023-04-29 11:26:51,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +25: [2023-04-29 11:26:51,731] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 8: [2023-04-29 11:26:51,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +62: [2023-04-29 11:26:51,732] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +62: [2023-04-29 11:26:51,732] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +63: [2023-04-29 11:26:51,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +63: [2023-04-29 11:26:51,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +63: [2023-04-29 11:26:51,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +63: [2023-04-29 11:26:51,733] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +25: [2023-04-29 11:26:51,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +26: [2023-04-29 11:26:51,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +26: [2023-04-29 11:26:51,734] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +20: [2023-04-29 11:26:51,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +62: [2023-04-29 11:26:51,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +62: [2023-04-29 11:26:51,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +22: [2023-04-29 11:26:51,735] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +20: [2023-04-29 11:26:51,735] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +62: [2023-04-29 11:26:51,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +62: [2023-04-29 11:26:51,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +20: [2023-04-29 11:26:51,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +38: [2023-04-29 11:26:51,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_24_mp_rank_02_optim_states.pt. +38: [2023-04-29 11:26:51,736] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 304 +26: [2023-04-29 11:26:51,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +22: [2023-04-29 11:26:51,736] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +20: [2023-04-29 11:26:51,736] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +26: [2023-04-29 11:26:51,737] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +62: [2023-04-29 11:26:51,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +62: [2023-04-29 11:26:51,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +62: [2023-04-29 11:26:51,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +62: [2023-04-29 11:26:51,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +22: [2023-04-29 11:26:51,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +62: [2023-04-29 11:26:51,738] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +25: [2023-04-29 11:26:51,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +25: [2023-04-29 11:26:51,739] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +30: [2023-04-29 11:26:51,739] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +62: [2023-04-29 11:26:51,740] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... + 6: [2023-04-29 11:26:51,741] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt. + 6: [2023-04-29 11:26:51,742] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 50 + 8: [2023-04-29 11:26:51,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 8: [2023-04-29 11:26:51,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +30: [2023-04-29 11:26:51,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt... +30: [2023-04-29 11:26:51,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt... +30: [2023-04-29 11:26:51,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt... +30: [2023-04-29 11:26:51,742] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt... +62: [2023-04-29 11:26:51,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +62: [2023-04-29 11:26:51,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +62: [2023-04-29 11:26:51,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +62: [2023-04-29 11:26:51,743] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +38: [2023-04-29 11:26:51,744] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 304 + 8: [2023-04-29 11:26:51,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +30: [2023-04-29 11:26:51,745] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... + 6: [2023-04-29 11:26:51,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt. + 6: [2023-04-29 11:26:51,747] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 48 +15: [2023-04-29 11:26:51,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +15: [2023-04-29 11:26:51,747] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +43: [2023-04-29 11:26:51,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_44_mp_rank_03_optim_states.pt... +43: [2023-04-29 11:26:51,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_47_mp_rank_03_optim_states.pt... +43: [2023-04-29 11:26:51,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_46_mp_rank_03_optim_states.pt... +43: [2023-04-29 11:26:51,748] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_45_mp_rank_03_optim_states.pt... +15: [2023-04-29 11:26:51,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +15: [2023-04-29 11:26:51,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +54: [2023-04-29 11:26:51,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 5: [2023-04-29 11:26:51,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +51: [2023-04-29 11:26:51,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +51: [2023-04-29 11:26:51,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +33: [2023-04-29 11:26:51,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_7_mp_rank_03_optim_states.pt... + 6: [2023-04-29 11:26:51,750] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 50 +24: [2023-04-29 11:26:51,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +24: [2023-04-29 11:26:51,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +33: [2023-04-29 11:26:51,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_4_mp_rank_03_optim_states.pt... +33: [2023-04-29 11:26:51,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_5_mp_rank_03_optim_states.pt... +33: [2023-04-29 11:26:51,746] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_6_mp_rank_03_optim_states.pt... +54: [2023-04-29 11:26:51,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 11:26:51,750] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +51: [2023-04-29 11:26:51,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +51: [2023-04-29 11:26:51,746] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +54: [2023-04-29 11:26:51,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +38: [2023-04-29 11:26:51,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +38: [2023-04-29 11:26:51,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +38: [2023-04-29 11:26:51,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +38: [2023-04-29 11:26:51,752] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +54: [2023-04-29 11:26:51,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +15: [2023-04-29 11:26:51,753] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +54: [2023-04-29 11:26:51,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +15: [2023-04-29 11:26:51,754] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +15: [2023-04-29 11:26:51,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 6: [2023-04-29 11:26:51,755] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 48 +23: [2023-04-29 11:26:51,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +23: [2023-04-29 11:26:51,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 5: [2023-04-29 11:26:51,755] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +23: [2023-04-29 11:26:51,755] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +54: [2023-04-29 11:26:51,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +23: [2023-04-29 11:26:51,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 5: [2023-04-29 11:26:51,756] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +54: [2023-04-29 11:26:51,756] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +15: [2023-04-29 11:26:51,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +54: [2023-04-29 11:26:51,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +54: [2023-04-29 11:26:51,757] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... + 5: [2023-04-29 11:26:51,758] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +63: [2023-04-29 11:26:51,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_124_mp_rank_02_optim_states.pt. +24: [2023-04-29 11:26:51,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +63: [2023-04-29 11:26:51,758] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 504 + 5: [2023-04-29 11:26:51,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +39: [2023-04-29 11:26:51,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_30_mp_rank_03_optim_states.pt... +39: [2023-04-29 11:26:51,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_29_mp_rank_03_optim_states.pt... +39: [2023-04-29 11:26:51,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_28_mp_rank_03_optim_states.pt... +39: [2023-04-29 11:26:51,759] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_31_mp_rank_03_optim_states.pt... +31: [2023-04-29 11:26:51,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +31: [2023-04-29 11:26:51,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +31: [2023-04-29 11:26:51,759] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +31: [2023-04-29 11:26:51,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +63: [2023-04-29 11:26:51,760] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +63: [2023-04-29 11:26:51,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +24: [2023-04-29 11:26:51,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 11:26:51,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 11:26:51,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +63: [2023-04-29 11:26:51,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +60: [2023-04-29 11:26:51,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +60: [2023-04-29 11:26:51,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +60: [2023-04-29 11:26:51,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +63: [2023-04-29 11:26:51,762] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +60: [2023-04-29 11:26:51,762] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +17: [2023-04-29 11:26:51,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 11:26:51,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +31: [2023-04-29 11:26:51,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +63: [2023-04-29 11:26:51,764] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +63: [2023-04-29 11:26:51,764] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +63: [2023-04-29 11:26:51,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +63: [2023-04-29 11:26:51,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +31: [2023-04-29 11:26:51,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +63: [2023-04-29 11:26:51,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +63: [2023-04-29 11:26:51,765] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +31: [2023-04-29 11:26:51,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +63: [2023-04-29 11:26:51,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +63: [2023-04-29 11:26:51,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +31: [2023-04-29 11:26:51,765] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +63: [2023-04-29 11:26:51,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +63: [2023-04-29 11:26:51,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +63: [2023-04-29 11:26:51,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +63: [2023-04-29 11:26:51,766] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +54: [2023-04-29 11:26:51,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +54: [2023-04-29 11:26:51,766] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +17: [2023-04-29 11:26:51,767] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +17: [2023-04-29 11:26:51,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +17: [2023-04-29 11:26:51,768] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +17: [2023-04-29 11:26:51,771] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +54: [2023-04-29 11:26:51,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +54: [2023-04-29 11:26:51,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +54: [2023-04-29 11:26:51,773] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +54: [2023-04-29 11:26:51,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +51: [2023-04-29 11:26:51,774] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +56: [2023-04-29 11:26:51,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_97_mp_rank_02_optim_states.pt. +51: [2023-04-29 11:26:51,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +56: [2023-04-29 11:26:51,775] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 450 +51: [2023-04-29 11:26:51,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +51: [2023-04-29 11:26:51,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +51: [2023-04-29 11:26:51,775] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +21: [2023-04-29 11:26:51,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +21: [2023-04-29 11:26:51,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +21: [2023-04-29 11:26:51,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +51: [2023-04-29 11:26:51,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +51: [2023-04-29 11:26:51,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +51: [2023-04-29 11:26:51,776] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +51: [2023-04-29 11:26:51,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +51: [2023-04-29 11:26:51,776] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +51: [2023-04-29 11:26:51,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +51: [2023-04-29 11:26:51,777] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +32: [2023-04-29 11:26:51,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +32: [2023-04-29 11:26:51,777] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +21: [2023-04-29 11:26:51,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +55: [2023-04-29 11:26:51,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_93_mp_rank_02_optim_states.pt. +55: [2023-04-29 11:26:51,779] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 442 +51: [2023-04-29 11:26:51,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +51: [2023-04-29 11:26:51,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +51: [2023-04-29 11:26:51,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +51: [2023-04-29 11:26:51,779] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +32: [2023-04-29 11:26:51,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +32: [2023-04-29 11:26:51,780] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +21: [2023-04-29 11:26:51,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +38: [2023-04-29 11:26:51,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +38: [2023-04-29 11:26:51,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +38: [2023-04-29 11:26:51,781] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +23: [2023-04-29 11:26:51,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +21: [2023-04-29 11:26:51,781] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +38: [2023-04-29 11:26:51,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +38: [2023-04-29 11:26:51,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +38: [2023-04-29 11:26:51,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +23: [2023-04-29 11:26:51,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +21: [2023-04-29 11:26:51,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +38: [2023-04-29 11:26:51,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +38: [2023-04-29 11:26:51,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +38: [2023-04-29 11:26:51,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +38: [2023-04-29 11:26:51,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +38: [2023-04-29 11:26:51,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +38: [2023-04-29 11:26:51,782] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +51: [2023-04-29 11:26:51,782] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_76_mp_rank_02_optim_states.pt. +51: [2023-04-29 11:26:51,783] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 408 +23: [2023-04-29 11:26:51,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +23: [2023-04-29 11:26:51,783] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +14: [2023-04-29 11:26:51,783] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +21: [2023-04-29 11:26:51,784] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +12: [2023-04-29 11:26:51,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +12: [2023-04-29 11:26:51,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +38: [2023-04-29 11:26:51,784] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_26_mp_rank_02_optim_states.pt. +38: [2023-04-29 11:26:51,785] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 308 +38: [2023-04-29 11:26:51,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +38: [2023-04-29 11:26:51,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +38: [2023-04-29 11:26:51,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +55: [2023-04-29 11:26:51,785] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 442 +38: [2023-04-29 11:26:51,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +55: [2023-04-29 11:26:51,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +55: [2023-04-29 11:26:51,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +55: [2023-04-29 11:26:51,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +55: [2023-04-29 11:26:51,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +14: [2023-04-29 11:26:51,786] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +12: [2023-04-29 11:26:51,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +12: [2023-04-29 11:26:51,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +51: [2023-04-29 11:26:51,791] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 408 +38: [2023-04-29 11:26:51,792] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 308 +58: [2023-04-29 11:26:51,792] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_107_mp_rank_02_optim_states.pt. +58: [2023-04-29 11:26:51,793] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 470 +60: [2023-04-29 11:26:51,793] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +56: [2023-04-29 11:26:51,794] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 450 + 0: [2023-04-29 11:26:51,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt. +60: [2023-04-29 11:26:51,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +60: [2023-04-29 11:26:51,794] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +60: [2023-04-29 11:26:51,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 0: [2023-04-29 11:26:51,794] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 6 +60: [2023-04-29 11:26:51,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +60: [2023-04-29 11:26:51,794] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +38: [2023-04-29 11:26:51,795] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_27_mp_rank_02_optim_states.pt. +38: [2023-04-29 11:26:51,795] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 310 +56: [2023-04-29 11:26:51,796] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 452 +14: [2023-04-29 11:26:51,796] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +60: [2023-04-29 11:26:51,798] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +60: [2023-04-29 11:26:51,798] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 8: [2023-04-29 11:26:51,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +14: [2023-04-29 11:26:51,799] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +29: [2023-04-29 11:26:51,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt... +29: [2023-04-29 11:26:51,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt... +29: [2023-04-29 11:26:51,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt... +29: [2023-04-29 11:26:51,800] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt... +58: [2023-04-29 11:26:51,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +58: [2023-04-29 11:26:51,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +58: [2023-04-29 11:26:51,800] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +58: [2023-04-29 11:26:51,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. + 0: [2023-04-29 11:26:51,802] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 6 +38: [2023-04-29 11:26:51,802] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 310 +25: [2023-04-29 11:26:51,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +48: [2023-04-29 11:26:51,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_67_mp_rank_02_optim_states.pt. +62: [2023-04-29 11:26:51,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_120_mp_rank_03_optim_states.pt... +62: [2023-04-29 11:26:51,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_123_mp_rank_03_optim_states.pt... +62: [2023-04-29 11:26:51,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_122_mp_rank_03_optim_states.pt... +62: [2023-04-29 11:26:51,803] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_121_mp_rank_03_optim_states.pt... +48: [2023-04-29 11:26:51,803] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 390 +20: [2023-04-29 11:26:51,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +20: [2023-04-29 11:26:51,801] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +20: [2023-04-29 11:26:51,804] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +38: [2023-04-29 11:26:51,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_25_mp_rank_02_optim_states.pt. +36: [2023-04-29 11:26:51,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_18_mp_rank_02_optim_states.pt. + 8: [2023-04-29 11:26:51,805] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +20: [2023-04-29 11:26:51,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +38: [2023-04-29 11:26:51,805] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 306 +36: [2023-04-29 11:26:51,805] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 292 +26: [2023-04-29 11:26:51,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +26: [2023-04-29 11:26:51,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +26: [2023-04-29 11:26:51,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +15: [2023-04-29 11:26:51,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +60: [2023-04-29 11:26:51,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +60: [2023-04-29 11:26:51,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +26: [2023-04-29 11:26:51,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +60: [2023-04-29 11:26:51,806] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +60: [2023-04-29 11:26:51,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +32: [2023-04-29 11:26:51,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +32: [2023-04-29 11:26:51,808] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 11:26:51,810] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 390 +25: [2023-04-29 11:26:51,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +15: [2023-04-29 11:26:51,810] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +22: [2023-04-29 11:26:51,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt... +22: [2023-04-29 11:26:51,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt... +22: [2023-04-29 11:26:51,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt... +22: [2023-04-29 11:26:51,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt... +27: [2023-04-29 11:26:51,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt. +27: [2023-04-29 11:26:51,811] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 218 +63: [2023-04-29 11:26:51,811] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_126_mp_rank_03_optim_states.pt... +63: [2023-04-29 11:26:51,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_127_mp_rank_03_optim_states.pt... +63: [2023-04-29 11:26:51,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_124_mp_rank_03_optim_states.pt... +63: [2023-04-29 11:26:51,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_125_mp_rank_03_optim_states.pt... +25: [2023-04-29 11:26:51,811] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +49: [2023-04-29 11:26:51,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +49: [2023-04-29 11:26:51,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +32: [2023-04-29 11:26:51,812] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +38: [2023-04-29 11:26:51,812] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 306 +32: [2023-04-29 11:26:51,812] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +36: [2023-04-29 11:26:51,812] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 292 +55: [2023-04-29 11:26:51,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +32: [2023-04-29 11:26:51,813] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +49: [2023-04-29 11:26:51,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +32: [2023-04-29 11:26:51,813] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +49: [2023-04-29 11:26:51,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +32: [2023-04-29 11:26:51,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +32: [2023-04-29 11:26:51,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +32: [2023-04-29 11:26:51,814] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +25: [2023-04-29 11:26:51,815] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +32: [2023-04-29 11:26:51,816] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +32: [2023-04-29 11:26:51,817] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +32: [2023-04-29 11:26:51,817] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +55: [2023-04-29 11:26:51,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +27: [2023-04-29 11:26:51,818] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 218 +55: [2023-04-29 11:26:51,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +25: [2023-04-29 11:26:51,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +25: [2023-04-29 11:26:51,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +25: [2023-04-29 11:26:51,819] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... + 5: [2023-04-29 11:26:51,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 5: [2023-04-29 11:26:51,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +55: [2023-04-29 11:26:51,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +25: [2023-04-29 11:26:51,821] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +60: [2023-04-29 11:26:51,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +60: [2023-04-29 11:26:51,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +60: [2023-04-29 11:26:51,821] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. + 8: [2023-04-29 11:26:51,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +60: [2023-04-29 11:26:51,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_115_mp_rank_02_optim_states.pt. +60: [2023-04-29 11:26:51,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +15: [2023-04-29 11:26:51,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +60: [2023-04-29 11:26:51,822] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 486 +24: [2023-04-29 11:26:51,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt... +24: [2023-04-29 11:26:51,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt... +24: [2023-04-29 11:26:51,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt... +24: [2023-04-29 11:26:51,822] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt... + 8: [2023-04-29 11:26:51,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 8: [2023-04-29 11:26:51,822] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 8: [2023-04-29 11:26:51,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 8: [2023-04-29 11:26:51,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 8: [2023-04-29 11:26:51,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 8: [2023-04-29 11:26:51,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +31: [2023-04-29 11:26:51,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 9: [2023-04-29 11:26:51,825] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt. + 9: [2023-04-29 11:26:51,825] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 76 + 8: [2023-04-29 11:26:51,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +58: [2023-04-29 11:26:51,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 11:26:51,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 5: [2023-04-29 11:26:51,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +58: [2023-04-29 11:26:51,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +58: [2023-04-29 11:26:51,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +58: [2023-04-29 11:26:51,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +51: [2023-04-29 11:26:51,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_77_mp_rank_02_optim_states.pt. +56: [2023-04-29 11:26:51,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_96_mp_rank_02_optim_states.pt. +58: [2023-04-29 11:26:51,829] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +17: [2023-04-29 11:26:51,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +56: [2023-04-29 11:26:51,829] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 448 +51: [2023-04-29 11:26:51,829] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 410 +31: [2023-04-29 11:26:51,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +56: [2023-04-29 11:26:51,830] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_99_mp_rank_02_optim_states.pt. +60: [2023-04-29 11:26:51,830] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 486 +56: [2023-04-29 11:26:51,831] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 454 +58: [2023-04-29 11:26:51,831] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +58: [2023-04-29 11:26:51,831] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +58: [2023-04-29 11:26:51,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +58: [2023-04-29 11:26:51,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +58: [2023-04-29 11:26:51,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... + 0: [2023-04-29 11:26:51,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt. +32: [2023-04-29 11:26:51,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +32: [2023-04-29 11:26:51,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +32: [2023-04-29 11:26:51,832] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. + 0: [2023-04-29 11:26:51,832] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 0 + 9: [2023-04-29 11:26:51,832] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 76 +58: [2023-04-29 11:26:51,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... + 8: [2023-04-29 11:26:51,832] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 8: [2023-04-29 11:26:51,833] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 5: [2023-04-29 11:26:51,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 11:26:51,833] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +15: [2023-04-29 11:26:51,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 8: [2023-04-29 11:26:51,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +58: [2023-04-29 11:26:51,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. + 8: [2023-04-29 11:26:51,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +58: [2023-04-29 11:26:51,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +38: [2023-04-29 11:26:51,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_26_mp_rank_03_optim_states.pt... +38: [2023-04-29 11:26:51,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_27_mp_rank_03_optim_states.pt... + 8: [2023-04-29 11:26:51,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +58: [2023-04-29 11:26:51,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +38: [2023-04-29 11:26:51,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_25_mp_rank_03_optim_states.pt... +38: [2023-04-29 11:26:51,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_24_mp_rank_03_optim_states.pt... + 8: [2023-04-29 11:26:51,834] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +58: [2023-04-29 11:26:51,834] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +32: [2023-04-29 11:26:51,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +17: [2023-04-29 11:26:51,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +56: [2023-04-29 11:26:51,836] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 448 +58: [2023-04-29 11:26:51,836] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_105_mp_rank_02_optim_states.pt. +58: [2023-04-29 11:26:51,837] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 466 +56: [2023-04-29 11:26:51,837] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 454 +17: [2023-04-29 11:26:51,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +51: [2023-04-29 11:26:51,838] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 410 + 0: [2023-04-29 11:26:51,839] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 0 +20: [2023-04-29 11:26:51,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +20: [2023-04-29 11:26:51,839] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +20: [2023-04-29 11:26:51,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +49: [2023-04-29 11:26:51,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +31: [2023-04-29 11:26:51,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +31: [2023-04-29 11:26:51,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +49: [2023-04-29 11:26:51,840] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +20: [2023-04-29 11:26:51,840] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +49: [2023-04-29 11:26:51,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +49: [2023-04-29 11:26:51,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +60: [2023-04-29 11:26:51,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_114_mp_rank_02_optim_states.pt. +60: [2023-04-29 11:26:51,841] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 484 +60: [2023-04-29 11:26:51,841] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_112_mp_rank_02_optim_states.pt. +60: [2023-04-29 11:26:51,842] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 480 +51: [2023-04-29 11:26:51,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_76_mp_rank_03_optim_states.pt... +51: [2023-04-29 11:26:51,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_79_mp_rank_03_optim_states.pt... +51: [2023-04-29 11:26:51,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_77_mp_rank_03_optim_states.pt... +49: [2023-04-29 11:26:51,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +51: [2023-04-29 11:26:51,843] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_78_mp_rank_03_optim_states.pt... +49: [2023-04-29 11:26:51,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 0: could not find arguments in the checkpoint ... + 0: checkpoint version 3.0 +36: [2023-04-29 11:26:51,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +36: [2023-04-29 11:26:51,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +36: [2023-04-29 11:26:51,844] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +49: [2023-04-29 11:26:51,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +49: [2023-04-29 11:26:51,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +54: [2023-04-29 11:26:51,845] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_91_mp_rank_02_optim_states.pt. +49: [2023-04-29 11:26:51,845] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +54: [2023-04-29 11:26:51,846] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 438 +36: [2023-04-29 11:26:51,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +49: [2023-04-29 11:26:51,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +49: [2023-04-29 11:26:51,846] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +49: [2023-04-29 11:26:51,846] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +21: [2023-04-29 11:26:51,848] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +23: [2023-04-29 11:26:51,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +23: [2023-04-29 11:26:51,849] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +60: [2023-04-29 11:26:51,850] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 480 +60: [2023-04-29 11:26:51,851] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 484 +41: [2023-04-29 11:26:51,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +41: [2023-04-29 11:26:51,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +41: [2023-04-29 11:26:51,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +41: [2023-04-29 11:26:51,852] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +23: [2023-04-29 11:26:51,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +23: [2023-04-29 11:26:51,853] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +21: [2023-04-29 11:26:51,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +21: [2023-04-29 11:26:51,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +21: [2023-04-29 11:26:51,854] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +54: [2023-04-29 11:26:51,855] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 438 +23: [2023-04-29 11:26:51,855] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +23: [2023-04-29 11:26:51,856] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +58: [2023-04-29 11:26:51,856] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 466 +49: [2023-04-29 11:26:51,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +49: [2023-04-29 11:26:51,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +49: [2023-04-29 11:26:51,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +49: [2023-04-29 11:26:51,856] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. + 9: [2023-04-29 11:26:51,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt. + 9: [2023-04-29 11:26:51,857] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 78 +10: [2023-04-29 11:26:51,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +10: [2023-04-29 11:26:51,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +10: [2023-04-29 11:26:51,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +23: [2023-04-29 11:26:51,858] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +10: [2023-04-29 11:26:51,858] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +58: [2023-04-29 11:26:51,858] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 470 +23: [2023-04-29 11:26:51,859] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... + 3: [2023-04-29 11:26:51,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 3: [2023-04-29 11:26:51,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +27: [2023-04-29 11:26:51,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt. +27: [2023-04-29 11:26:51,862] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 216 + 3: [2023-04-29 11:26:51,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 3: [2023-04-29 11:26:51,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 9: [2023-04-29 11:26:51,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 9: [2023-04-29 11:26:51,864] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 9: [2023-04-29 11:26:51,865] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +20: [2023-04-29 11:26:51,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 9: [2023-04-29 11:26:51,866] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +20: [2023-04-29 11:26:51,866] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 9: [2023-04-29 11:26:51,867] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 78 +54: [2023-04-29 11:26:51,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_88_mp_rank_02_optim_states.pt. +37: [2023-04-29 11:26:51,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_21_mp_rank_02_optim_states.pt. +54: [2023-04-29 11:26:51,867] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 432 +37: [2023-04-29 11:26:51,867] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 298 +54: [2023-04-29 11:26:51,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_90_mp_rank_02_optim_states.pt. +54: [2023-04-29 11:26:51,868] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 436 +48: [2023-04-29 11:26:51,868] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_65_mp_rank_02_optim_states.pt. +27: [2023-04-29 11:26:51,869] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 216 +48: [2023-04-29 11:26:51,868] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 386 +36: [2023-04-29 11:26:51,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +36: [2023-04-29 11:26:51,871] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +36: [2023-04-29 11:26:51,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +36: [2023-04-29 11:26:51,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +36: [2023-04-29 11:26:51,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +12: [2023-04-29 11:26:51,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt... +12: [2023-04-29 11:26:51,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt... +12: [2023-04-29 11:26:51,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt... +12: [2023-04-29 11:26:51,872] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt... +36: [2023-04-29 11:26:51,872] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +20: [2023-04-29 11:26:51,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +36: [2023-04-29 11:26:51,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +36: [2023-04-29 11:26:51,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +36: [2023-04-29 11:26:51,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +20: [2023-04-29 11:26:51,873] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +62: [2023-04-29 11:26:51,873] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_121_mp_rank_02_optim_states.pt. +62: [2023-04-29 11:26:51,873] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 498 +36: [2023-04-29 11:26:51,875] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +48: [2023-04-29 11:26:51,875] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 386 +54: [2023-04-29 11:26:51,875] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 432 +54: [2023-04-29 11:26:51,876] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 436 +36: [2023-04-29 11:26:51,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +36: [2023-04-29 11:26:51,876] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +36: [2023-04-29 11:26:51,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +36: [2023-04-29 11:26:51,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +36: [2023-04-29 11:26:51,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +36: [2023-04-29 11:26:51,876] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +37: [2023-04-29 11:26:51,877] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 298 +14: [2023-04-29 11:26:51,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt... +14: [2023-04-29 11:26:51,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt... +14: [2023-04-29 11:26:51,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt... +14: [2023-04-29 11:26:51,877] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt... +40: [2023-04-29 11:26:51,878] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_34_mp_rank_02_optim_states.pt. +60: [2023-04-29 11:26:51,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_113_mp_rank_03_optim_states.pt... +60: [2023-04-29 11:26:51,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_114_mp_rank_03_optim_states.pt... +40: [2023-04-29 11:26:51,878] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 324 +60: [2023-04-29 11:26:51,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_115_mp_rank_03_optim_states.pt... +60: [2023-04-29 11:26:51,878] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_112_mp_rank_03_optim_states.pt... +63: [2023-04-29 11:26:51,878] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 508 +55: [2023-04-29 11:26:51,879] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 11:26:51,879] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +40: [2023-04-29 11:26:51,880] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_35_mp_rank_02_optim_states.pt. +40: [2023-04-29 11:26:51,880] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 326 +55: [2023-04-29 11:26:51,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +63: [2023-04-29 11:26:51,882] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 510 +41: [2023-04-29 11:26:51,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +62: [2023-04-29 11:26:51,883] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 498 +54: [2023-04-29 11:26:51,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_88_mp_rank_03_optim_states.pt... +54: [2023-04-29 11:26:51,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_90_mp_rank_03_optim_states.pt... +54: [2023-04-29 11:26:51,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_91_mp_rank_03_optim_states.pt... +41: [2023-04-29 11:26:51,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +54: [2023-04-29 11:26:51,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_89_mp_rank_03_optim_states.pt... +41: [2023-04-29 11:26:51,883] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +55: [2023-04-29 11:26:51,884] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +10: [2023-04-29 11:26:51,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +55: [2023-04-29 11:26:51,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +63: [2023-04-29 11:26:51,886] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 506 +12: [2023-04-29 11:26:51,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +12: [2023-04-29 11:26:51,887] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +12: [2023-04-29 11:26:51,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 8: [2023-04-29 11:26:51,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +63: [2023-04-29 11:26:51,888] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 504 +12: [2023-04-29 11:26:51,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 3: [2023-04-29 11:26:51,889] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +14: [2023-04-29 11:26:51,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +14: [2023-04-29 11:26:51,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +62: [2023-04-29 11:26:51,890] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_123_mp_rank_02_optim_states.pt. +62: [2023-04-29 11:26:51,890] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 502 +14: [2023-04-29 11:26:51,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +10: [2023-04-29 11:26:51,890] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +14: [2023-04-29 11:26:51,891] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +20: [2023-04-29 11:26:51,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt... +20: [2023-04-29 11:26:51,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt... +20: [2023-04-29 11:26:51,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt... +20: [2023-04-29 11:26:51,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt... + 3: [2023-04-29 11:26:51,891] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +10: [2023-04-29 11:26:51,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 3: [2023-04-29 11:26:51,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 9: [2023-04-29 11:26:51,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 3: [2023-04-29 11:26:51,892] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +10: [2023-04-29 11:26:51,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 9: [2023-04-29 11:26:51,893] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +32: [2023-04-29 11:26:51,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt... +32: [2023-04-29 11:26:51,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_3_mp_rank_03_optim_states.pt... +32: [2023-04-29 11:26:51,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_1_mp_rank_03_optim_states.pt... +32: [2023-04-29 11:26:51,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_2_mp_rank_03_optim_states.pt... +55: [2023-04-29 11:26:51,894] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +26: [2023-04-29 11:26:51,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt... +26: [2023-04-29 11:26:51,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt... +26: [2023-04-29 11:26:51,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt... +26: [2023-04-29 11:26:51,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt... + 9: [2023-04-29 11:26:51,894] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 9: [2023-04-29 11:26:51,896] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +58: [2023-04-29 11:26:51,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_106_mp_rank_03_optim_states.pt... +58: [2023-04-29 11:26:51,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_104_mp_rank_03_optim_states.pt... +23: [2023-04-29 11:26:51,897] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt. +58: [2023-04-29 11:26:51,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_105_mp_rank_03_optim_states.pt... +58: [2023-04-29 11:26:51,897] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_107_mp_rank_03_optim_states.pt... +23: [2023-04-29 11:26:51,897] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 186 +55: [2023-04-29 11:26:51,898] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +62: [2023-04-29 11:26:51,898] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 502 +40: [2023-04-29 11:26:51,901] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_32_mp_rank_02_optim_states.pt. +55: [2023-04-29 11:26:51,902] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +40: [2023-04-29 11:26:51,902] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 320 +19: [2023-04-29 11:26:51,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +19: [2023-04-29 11:26:51,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +19: [2023-04-29 11:26:51,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +19: [2023-04-29 11:26:51,902] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +15: [2023-04-29 11:26:51,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +15: [2023-04-29 11:26:51,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +15: [2023-04-29 11:26:51,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 1: [2023-04-29 11:26:51,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 1: [2023-04-29 11:26:51,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 1: [2023-04-29 11:26:51,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +15: [2023-04-29 11:26:51,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 5: [2023-04-29 11:26:51,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt... + 5: [2023-04-29 11:26:51,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt... + 1: [2023-04-29 11:26:51,904] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 5: [2023-04-29 11:26:51,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt... + 5: [2023-04-29 11:26:51,904] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt... + 8: [2023-04-29 11:26:51,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 8: [2023-04-29 11:26:51,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 8: [2023-04-29 11:26:51,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 11:26:51,905] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +17: [2023-04-29 11:26:51,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +17: [2023-04-29 11:26:51,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +17: [2023-04-29 11:26:51,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +55: [2023-04-29 11:26:51,906] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +23: [2023-04-29 11:26:51,906] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 186 +31: [2023-04-29 11:26:51,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +31: [2023-04-29 11:26:51,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +31: [2023-04-29 11:26:51,908] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +31: [2023-04-29 11:26:51,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +49: [2023-04-29 11:26:51,909] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_71_mp_rank_02_optim_states.pt. +49: [2023-04-29 11:26:51,910] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 398 +12: [2023-04-29 11:26:51,910] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +37: [2023-04-29 11:26:51,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +37: [2023-04-29 11:26:51,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +14: [2023-04-29 11:26:51,913] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +15: [2023-04-29 11:26:51,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt... +15: [2023-04-29 11:26:51,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt... +15: [2023-04-29 11:26:51,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt... +15: [2023-04-29 11:26:51,914] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt... +31: [2023-04-29 11:26:51,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt... +31: [2023-04-29 11:26:51,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt... +31: [2023-04-29 11:26:51,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt... +31: [2023-04-29 11:26:51,915] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt... +37: [2023-04-29 11:26:51,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +37: [2023-04-29 11:26:51,916] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +45: [2023-04-29 11:26:51,917] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_53_mp_rank_02_optim_states.pt. +45: [2023-04-29 11:26:51,917] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 362 +49: [2023-04-29 11:26:51,918] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 398 +17: [2023-04-29 11:26:51,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt... +17: [2023-04-29 11:26:51,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt... +17: [2023-04-29 11:26:51,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt... +17: [2023-04-29 11:26:51,918] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt... +28: [2023-04-29 11:26:51,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +28: [2023-04-29 11:26:51,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +28: [2023-04-29 11:26:51,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +14: [2023-04-29 11:26:51,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +12: [2023-04-29 11:26:51,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +12: [2023-04-29 11:26:51,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +12: [2023-04-29 11:26:51,920] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +14: [2023-04-29 11:26:51,922] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +28: [2023-04-29 11:26:51,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +14: [2023-04-29 11:26:51,923] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +45: [2023-04-29 11:26:51,923] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 362 +46: [2023-04-29 11:26:51,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +46: [2023-04-29 11:26:51,926] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +21: [2023-04-29 11:26:51,928] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt... +21: [2023-04-29 11:26:51,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt... +19: [2023-04-29 11:26:51,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 11:26:51,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt... +21: [2023-04-29 11:26:51,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt... +19: [2023-04-29 11:26:51,929] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +59: [2023-04-29 11:26:51,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +46: [2023-04-29 11:26:51,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. + 1: [2023-04-29 11:26:51,930] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +59: [2023-04-29 11:26:51,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +34: [2023-04-29 11:26:51,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +34: [2023-04-29 11:26:51,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +46: [2023-04-29 11:26:51,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +20: [2023-04-29 11:26:51,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +15: [2023-04-29 11:26:51,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +34: [2023-04-29 11:26:51,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +34: [2023-04-29 11:26:51,931] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +19: [2023-04-29 11:26:51,931] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +59: [2023-04-29 11:26:51,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_110_mp_rank_02_optim_states.pt. +59: [2023-04-29 11:26:51,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +59: [2023-04-29 11:26:51,932] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 476 +19: [2023-04-29 11:26:51,932] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +59: [2023-04-29 11:26:51,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +15: [2023-04-29 11:26:51,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 1: [2023-04-29 11:26:51,933] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +31: [2023-04-29 11:26:51,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +17: [2023-04-29 11:26:51,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +17: [2023-04-29 11:26:51,934] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +15: [2023-04-29 11:26:51,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +20: [2023-04-29 11:26:51,935] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +15: [2023-04-29 11:26:51,935] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +20: [2023-04-29 11:26:51,936] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +17: [2023-04-29 11:26:51,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +17: [2023-04-29 11:26:51,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +49: [2023-04-29 11:26:51,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_69_mp_rank_03_optim_states.pt... +49: [2023-04-29 11:26:51,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_71_mp_rank_03_optim_states.pt... +49: [2023-04-29 11:26:51,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_68_mp_rank_03_optim_states.pt... +49: [2023-04-29 11:26:51,938] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_70_mp_rank_03_optim_states.pt... +31: [2023-04-29 11:26:51,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +59: [2023-04-29 11:26:51,940] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 476 + 1: [2023-04-29 11:26:51,937] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 1: [2023-04-29 11:26:51,940] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +20: [2023-04-29 11:26:51,941] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +31: [2023-04-29 11:26:51,943] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +37: [2023-04-29 11:26:51,944] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +20: [2023-04-29 11:26:51,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +20: [2023-04-29 11:26:51,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +45: [2023-04-29 11:26:51,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +45: [2023-04-29 11:26:51,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +31: [2023-04-29 11:26:51,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +45: [2023-04-29 11:26:51,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +45: [2023-04-29 11:26:51,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +37: [2023-04-29 11:26:51,945] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +49: [2023-04-29 11:26:51,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_69_mp_rank_02_optim_states.pt. + 3: [2023-04-29 11:26:51,945] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt. +49: [2023-04-29 11:26:51,946] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 394 + 3: [2023-04-29 11:26:51,946] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 26 +37: [2023-04-29 11:26:51,947] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +41: [2023-04-29 11:26:51,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +28: [2023-04-29 11:26:51,948] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +10: [2023-04-29 11:26:51,948] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +36: [2023-04-29 11:26:51,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_17_mp_rank_03_optim_states.pt... +36: [2023-04-29 11:26:51,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_18_mp_rank_03_optim_states.pt... +36: [2023-04-29 11:26:51,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_19_mp_rank_03_optim_states.pt... +36: [2023-04-29 11:26:51,949] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_16_mp_rank_03_optim_states.pt... +40: [2023-04-29 11:26:51,950] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 326 +41: [2023-04-29 11:26:51,950] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +37: [2023-04-29 11:26:51,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +54: [2023-04-29 11:26:51,951] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_89_mp_rank_02_optim_states.pt. +28: [2023-04-29 11:26:51,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +28: [2023-04-29 11:26:51,951] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +54: [2023-04-29 11:26:51,951] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 434 +28: [2023-04-29 11:26:51,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +41: [2023-04-29 11:26:51,952] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +20: [2023-04-29 11:26:51,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +10: [2023-04-29 11:26:51,953] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +20: [2023-04-29 11:26:51,954] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... + 3: [2023-04-29 11:26:51,954] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 26 +49: [2023-04-29 11:26:51,954] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 394 + 4: [2023-04-29 11:26:51,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 4: [2023-04-29 11:26:51,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 4: [2023-04-29 11:26:51,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 3: [2023-04-29 11:26:51,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 4: [2023-04-29 11:26:51,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +41: [2023-04-29 11:26:51,956] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +46: [2023-04-29 11:26:51,957] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 11:26:51,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 11:26:51,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +46: [2023-04-29 11:26:51,957] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +40: [2023-04-29 11:26:51,958] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 320 +59: [2023-04-29 11:26:51,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +59: [2023-04-29 11:26:51,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +59: [2023-04-29 11:26:51,958] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +59: [2023-04-29 11:26:51,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +59: [2023-04-29 11:26:51,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +46: [2023-04-29 11:26:51,959] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +59: [2023-04-29 11:26:51,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 9: [2023-04-29 11:26:51,958] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +46: [2023-04-29 11:26:51,959] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +46: [2023-04-29 11:26:51,960] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 3: [2023-04-29 11:26:51,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +46: [2023-04-29 11:26:51,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +54: [2023-04-29 11:26:51,961] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 434 + 6: [2023-04-29 11:26:51,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt. +46: [2023-04-29 11:26:51,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +10: [2023-04-29 11:26:51,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +10: [2023-04-29 11:26:51,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 11:26:51,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 9: [2023-04-29 11:26:51,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 6: [2023-04-29 11:26:51,961] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 54 +48: [2023-04-29 11:26:51,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +48: [2023-04-29 11:26:51,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +40: [2023-04-29 11:26:51,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_33_mp_rank_02_optim_states.pt. +46: [2023-04-29 11:26:51,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 11:26:51,961] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +34: [2023-04-29 11:26:51,961] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +40: [2023-04-29 11:26:51,962] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 322 +48: [2023-04-29 11:26:51,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +59: [2023-04-29 11:26:51,962] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +59: [2023-04-29 11:26:51,962] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 0: [2023-04-29 11:26:51,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 0: [2023-04-29 11:26:51,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +10: [2023-04-29 11:26:51,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 9: [2023-04-29 11:26:51,963] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 0: [2023-04-29 11:26:51,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +34: [2023-04-29 11:26:51,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +36: [2023-04-29 11:26:51,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_17_mp_rank_02_optim_states.pt. + 0: [2023-04-29 11:26:51,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 9: [2023-04-29 11:26:51,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +58: [2023-04-29 11:26:51,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_106_mp_rank_02_optim_states.pt. +36: [2023-04-29 11:26:51,964] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 290 +58: [2023-04-29 11:26:51,964] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 468 +34: [2023-04-29 11:26:51,964] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +41: [2023-04-29 11:26:51,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... + 8: [2023-04-29 11:26:51,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt... + 8: [2023-04-29 11:26:51,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt... + 8: [2023-04-29 11:26:51,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt... +59: [2023-04-29 11:26:51,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +59: [2023-04-29 11:26:51,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +59: [2023-04-29 11:26:51,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +59: [2023-04-29 11:26:51,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... + 8: [2023-04-29 11:26:51,965] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt... +40: [2023-04-29 11:26:51,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +40: [2023-04-29 11:26:51,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +40: [2023-04-29 11:26:51,965] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +41: [2023-04-29 11:26:51,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +56: [2023-04-29 11:26:51,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +56: [2023-04-29 11:26:51,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. + 3: [2023-04-29 11:26:51,966] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +56: [2023-04-29 11:26:51,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +40: [2023-04-29 11:26:51,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +40: [2023-04-29 11:26:51,966] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 324 +56: [2023-04-29 11:26:51,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. + 9: [2023-04-29 11:26:51,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 9: [2023-04-29 11:26:51,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt. + 9: [2023-04-29 11:26:51,967] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 74 +34: [2023-04-29 11:26:51,967] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +10: [2023-04-29 11:26:51,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +10: [2023-04-29 11:26:51,968] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +40: [2023-04-29 11:26:51,969] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 322 + 9: [2023-04-29 11:26:51,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... + 9: [2023-04-29 11:26:51,969] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... + 6: [2023-04-29 11:26:51,969] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 54 +10: [2023-04-29 11:26:51,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +46: [2023-04-29 11:26:51,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +46: [2023-04-29 11:26:51,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +46: [2023-04-29 11:26:51,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +46: [2023-04-29 11:26:51,970] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +59: [2023-04-29 11:26:51,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +59: [2023-04-29 11:26:51,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +59: [2023-04-29 11:26:51,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +59: [2023-04-29 11:26:51,970] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +47: [2023-04-29 11:26:51,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_61_mp_rank_02_optim_states.pt. +45: [2023-04-29 11:26:51,971] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +47: [2023-04-29 11:26:51,971] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 378 + 3: [2023-04-29 11:26:51,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 11:26:51,972] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 9: [2023-04-29 11:26:51,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +12: [2023-04-29 11:26:51,973] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +45: [2023-04-29 11:26:51,973] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +58: [2023-04-29 11:26:51,973] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 468 + 9: [2023-04-29 11:26:51,974] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 74 +36: [2023-04-29 11:26:51,975] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 290 +45: [2023-04-29 11:26:51,976] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +46: [2023-04-29 11:26:51,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +46: [2023-04-29 11:26:51,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +46: [2023-04-29 11:26:51,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +46: [2023-04-29 11:26:51,978] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +12: [2023-04-29 11:26:51,978] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 3: [2023-04-29 11:26:51,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +47: [2023-04-29 11:26:51,979] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 378 +45: [2023-04-29 11:26:51,979] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +14: [2023-04-29 11:26:51,979] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 11:26:51,980] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +22: [2023-04-29 11:26:51,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +22: [2023-04-29 11:26:51,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +22: [2023-04-29 11:26:51,982] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +14: [2023-04-29 11:26:51,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +22: [2023-04-29 11:26:51,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +44: [2023-04-29 11:26:51,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +44: [2023-04-29 11:26:51,983] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. + 4: [2023-04-29 11:26:51,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 4: [2023-04-29 11:26:51,984] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 4: [2023-04-29 11:26:51,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 4: [2023-04-29 11:26:51,985] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +49: [2023-04-29 11:26:51,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_68_mp_rank_02_optim_states.pt. +49: [2023-04-29 11:26:51,986] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 392 +24: [2023-04-29 11:26:51,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +24: [2023-04-29 11:26:51,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +44: [2023-04-29 11:26:51,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +14: [2023-04-29 11:26:51,986] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +24: [2023-04-29 11:26:51,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +24: [2023-04-29 11:26:51,986] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +14: [2023-04-29 11:26:51,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +48: [2023-04-29 11:26:51,987] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +26: [2023-04-29 11:26:51,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +26: [2023-04-29 11:26:51,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +26: [2023-04-29 11:26:51,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +26: [2023-04-29 11:26:51,987] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +14: [2023-04-29 11:26:51,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +44: [2023-04-29 11:26:51,988] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +61: [2023-04-29 11:26:51,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +61: [2023-04-29 11:26:51,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +61: [2023-04-29 11:26:51,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +12: [2023-04-29 11:26:51,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 0: [2023-04-29 11:26:51,990] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +61: [2023-04-29 11:26:51,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +19: [2023-04-29 11:26:51,991] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +27: [2023-04-29 11:26:51,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +27: [2023-04-29 11:26:51,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +27: [2023-04-29 11:26:51,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +27: [2023-04-29 11:26:51,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 0: [2023-04-29 11:26:51,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +14: [2023-04-29 11:26:51,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +48: [2023-04-29 11:26:51,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +48: [2023-04-29 11:26:51,993] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +12: [2023-04-29 11:26:51,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +12: [2023-04-29 11:26:51,993] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +48: [2023-04-29 11:26:51,994] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +49: [2023-04-29 11:26:51,994] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 392 +19: [2023-04-29 11:26:51,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +14: [2023-04-29 11:26:51,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 0: [2023-04-29 11:26:51,995] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +45: [2023-04-29 11:26:51,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_54_mp_rank_02_optim_states.pt. +45: [2023-04-29 11:26:51,995] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_55_mp_rank_02_optim_states.pt. +45: [2023-04-29 11:26:51,996] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 364 +45: [2023-04-29 11:26:51,996] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 366 + 0: [2023-04-29 11:26:51,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +19: [2023-04-29 11:26:51,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +56: [2023-04-29 11:26:51,996] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +15: [2023-04-29 11:26:51,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +40: [2023-04-29 11:26:51,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +56: [2023-04-29 11:26:51,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +12: [2023-04-29 11:26:51,997] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 1: [2023-04-29 11:26:51,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +56: [2023-04-29 11:26:51,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 1: [2023-04-29 11:26:51,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +56: [2023-04-29 11:26:51,998] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +17: [2023-04-29 11:26:51,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +19: [2023-04-29 11:26:51,999] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +19: [2023-04-29 11:26:51,999] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +40: [2023-04-29 11:26:52,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +40: [2023-04-29 11:26:52,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +40: [2023-04-29 11:26:52,000] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 0: [2023-04-29 11:26:52,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt. +31: [2023-04-29 11:26:52,000] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +12: [2023-04-29 11:26:52,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 0: [2023-04-29 11:26:52,001] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 4 +12: [2023-04-29 11:26:52,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +14: [2023-04-29 11:26:52,001] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +21: [2023-04-29 11:26:52,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +21: [2023-04-29 11:26:52,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +19: [2023-04-29 11:26:52,002] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 1: [2023-04-29 11:26:52,003] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 1: [2023-04-29 11:26:52,004] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +21: [2023-04-29 11:26:52,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +29: [2023-04-29 11:26:52,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +29: [2023-04-29 11:26:52,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +29: [2023-04-29 11:26:52,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +21: [2023-04-29 11:26:52,004] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +11: [2023-04-29 11:26:52,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +11: [2023-04-29 11:26:52,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +15: [2023-04-29 11:26:52,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +11: [2023-04-29 11:26:52,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +11: [2023-04-29 11:26:52,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +19: [2023-04-29 11:26:52,005] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +17: [2023-04-29 11:26:52,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +15: [2023-04-29 11:26:52,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 11:26:52,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt. +17: [2023-04-29 11:26:52,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 11:26:52,006] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 30 +53: [2023-04-29 11:26:52,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +53: [2023-04-29 11:26:52,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +57: [2023-04-29 11:26:52,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. + 1: [2023-04-29 11:26:52,005] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +57: [2023-04-29 11:26:52,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +57: [2023-04-29 11:26:52,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +53: [2023-04-29 11:26:52,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +53: [2023-04-29 11:26:52,006] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. + 0: [2023-04-29 11:26:52,007] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 4 +57: [2023-04-29 11:26:52,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +19: [2023-04-29 11:26:52,007] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +29: [2023-04-29 11:26:52,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +17: [2023-04-29 11:26:52,008] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +45: [2023-04-29 11:26:52,009] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 366 +45: [2023-04-29 11:26:52,009] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 364 +15: [2023-04-29 11:26:52,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +15: [2023-04-29 11:26:52,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +24: [2023-04-29 11:26:52,009] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +37: [2023-04-29 11:26:52,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 1: [2023-04-29 11:26:52,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 6: [2023-04-29 11:26:52,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 6: [2023-04-29 11:26:52,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 6: [2023-04-29 11:26:52,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +22: [2023-04-29 11:26:52,010] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 6: [2023-04-29 11:26:52,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +44: [2023-04-29 11:26:52,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +31: [2023-04-29 11:26:52,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +44: [2023-04-29 11:26:52,011] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +13: [2023-04-29 11:26:52,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +13: [2023-04-29 11:26:52,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +13: [2023-04-29 11:26:52,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +17: [2023-04-29 11:26:52,012] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +13: [2023-04-29 11:26:52,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +31: [2023-04-29 11:26:52,012] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +22: [2023-04-29 11:26:52,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +17: [2023-04-29 11:26:52,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +15: [2023-04-29 11:26:52,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +44: [2023-04-29 11:26:52,013] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 1: [2023-04-29 11:26:52,013] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 11:26:52,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +37: [2023-04-29 11:26:52,014] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +28: [2023-04-29 11:26:52,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 3: [2023-04-29 11:26:52,015] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 30 +15: [2023-04-29 11:26:52,015] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +15: [2023-04-29 11:26:52,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +26: [2023-04-29 11:26:52,016] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +44: [2023-04-29 11:26:52,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +61: [2023-04-29 11:26:52,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +34: [2023-04-29 11:26:52,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt. +24: [2023-04-29 11:26:52,017] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +34: [2023-04-29 11:26:52,017] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 276 +61: [2023-04-29 11:26:52,018] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +31: [2023-04-29 11:26:52,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +31: [2023-04-29 11:26:52,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +37: [2023-04-29 11:26:52,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +24: [2023-04-29 11:26:52,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +17: [2023-04-29 11:26:52,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +31: [2023-04-29 11:26:52,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +26: [2023-04-29 11:26:52,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +22: [2023-04-29 11:26:52,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 1: [2023-04-29 11:26:52,019] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +24: [2023-04-29 11:26:52,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +22: [2023-04-29 11:26:52,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +27: [2023-04-29 11:26:52,020] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +27: [2023-04-29 11:26:52,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +27: [2023-04-29 11:26:52,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +27: [2023-04-29 11:26:52,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +28: [2023-04-29 11:26:52,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +61: [2023-04-29 11:26:52,021] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +37: [2023-04-29 11:26:52,022] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +61: [2023-04-29 11:26:52,022] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +28: [2023-04-29 11:26:52,023] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +37: [2023-04-29 11:26:52,023] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +26: [2023-04-29 11:26:52,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +31: [2023-04-29 11:26:52,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +31: [2023-04-29 11:26:52,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +26: [2023-04-29 11:26:52,024] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +28: [2023-04-29 11:26:52,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +28: [2023-04-29 11:26:52,025] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +34: [2023-04-29 11:26:52,025] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 276 +34: [2023-04-29 11:26:52,027] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_8_mp_rank_02_optim_states.pt. +34: [2023-04-29 11:26:52,028] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 272 +28: [2023-04-29 11:26:52,028] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +34: [2023-04-29 11:26:52,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt. +18: [2023-04-29 11:26:52,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt. +34: [2023-04-29 11:26:52,029] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 278 +18: [2023-04-29 11:26:52,029] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 148 +60: [2023-04-29 11:26:52,029] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_113_mp_rank_02_optim_states.pt. +60: [2023-04-29 11:26:52,029] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 482 +59: [2023-04-29 11:26:52,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_109_mp_rank_03_optim_states.pt... +59: [2023-04-29 11:26:52,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_111_mp_rank_03_optim_states.pt... +59: [2023-04-29 11:26:52,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_110_mp_rank_03_optim_states.pt... +59: [2023-04-29 11:26:52,030] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_108_mp_rank_03_optim_states.pt... +37: [2023-04-29 11:26:52,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +29: [2023-04-29 11:26:52,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +28: [2023-04-29 11:26:52,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +28: [2023-04-29 11:26:52,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +34: [2023-04-29 11:26:52,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +11: [2023-04-29 11:26:52,031] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +34: [2023-04-29 11:26:52,031] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +53: [2023-04-29 11:26:52,032] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +25: [2023-04-29 11:26:52,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt. +57: [2023-04-29 11:26:52,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +29: [2023-04-29 11:26:52,033] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +25: [2023-04-29 11:26:52,033] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 202 +41: [2023-04-29 11:26:52,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_39_mp_rank_02_optim_states.pt. +41: [2023-04-29 11:26:52,033] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 334 +21: [2023-04-29 11:26:52,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +21: [2023-04-29 11:26:52,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +21: [2023-04-29 11:26:52,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +29: [2023-04-29 11:26:52,034] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +57: [2023-04-29 11:26:52,035] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +18: [2023-04-29 11:26:52,035] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 148 +34: [2023-04-29 11:26:52,035] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 272 +61: [2023-04-29 11:26:52,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_117_mp_rank_02_optim_states.pt. +61: [2023-04-29 11:26:52,036] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 490 +21: [2023-04-29 11:26:52,037] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +47: [2023-04-29 11:26:52,037] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_63_mp_rank_02_optim_states.pt. +57: [2023-04-29 11:26:52,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +53: [2023-04-29 11:26:52,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +53: [2023-04-29 11:26:52,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +34: [2023-04-29 11:26:52,037] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 278 +53: [2023-04-29 11:26:52,036] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +37: [2023-04-29 11:26:52,036] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +47: [2023-04-29 11:26:52,037] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 382 +36: [2023-04-29 11:26:52,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_19_mp_rank_02_optim_states.pt. +52: [2023-04-29 11:26:52,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +52: [2023-04-29 11:26:52,038] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +57: [2023-04-29 11:26:52,038] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +36: [2023-04-29 11:26:52,038] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 294 +60: [2023-04-29 11:26:52,038] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 482 +11: [2023-04-29 11:26:52,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +11: [2023-04-29 11:26:52,039] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +25: [2023-04-29 11:26:52,040] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 202 + 2: [2023-04-29 11:26:52,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 2: [2023-04-29 11:26:52,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 2: [2023-04-29 11:26:52,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +52: [2023-04-29 11:26:52,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. + 2: [2023-04-29 11:26:52,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +52: [2023-04-29 11:26:52,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +45: [2023-04-29 11:26:52,040] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 11:26:52,041] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 334 +29: [2023-04-29 11:26:52,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 6: [2023-04-29 11:26:52,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 6: [2023-04-29 11:26:52,041] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +34: [2023-04-29 11:26:52,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +11: [2023-04-29 11:26:52,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +34: [2023-04-29 11:26:52,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +13: [2023-04-29 11:26:52,043] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +61: [2023-04-29 11:26:52,043] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 490 +13: [2023-04-29 11:26:52,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +37: [2023-04-29 11:26:52,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +13: [2023-04-29 11:26:52,044] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 6: [2023-04-29 11:26:52,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 6: [2023-04-29 11:26:52,045] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +47: [2023-04-29 11:26:52,045] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 382 +45: [2023-04-29 11:26:52,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +34: [2023-04-29 11:26:52,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 11:26:52,046] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +50: [2023-04-29 11:26:52,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +50: [2023-04-29 11:26:52,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +50: [2023-04-29 11:26:52,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +50: [2023-04-29 11:26:52,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +34: [2023-04-29 11:26:52,046] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +46: [2023-04-29 11:26:52,047] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_58_mp_rank_02_optim_states.pt. +13: [2023-04-29 11:26:52,047] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +46: [2023-04-29 11:26:52,047] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 372 +36: [2023-04-29 11:26:52,047] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 294 +48: [2023-04-29 11:26:52,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 11:26:52,050] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... + 4: [2023-04-29 11:26:52,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 4: [2023-04-29 11:26:52,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 4: [2023-04-29 11:26:52,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +34: [2023-04-29 11:26:52,053] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... + 4: [2023-04-29 11:26:52,053] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +56: [2023-04-29 11:26:52,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +45: [2023-04-29 11:26:52,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +47: [2023-04-29 11:26:52,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +47: [2023-04-29 11:26:52,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +46: [2023-04-29 11:26:52,055] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 372 +34: [2023-04-29 11:26:52,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +48: [2023-04-29 11:26:52,056] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... + 3: [2023-04-29 11:26:52,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt. +28: [2023-04-29 11:26:52,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt. +28: [2023-04-29 11:26:52,057] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 228 + 3: [2023-04-29 11:26:52,057] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 28 + 0: [2023-04-29 11:26:52,057] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 0: [2023-04-29 11:26:52,058] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +47: [2023-04-29 11:26:52,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +56: [2023-04-29 11:26:52,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +27: [2023-04-29 11:26:52,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt. +37: [2023-04-29 11:26:52,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_22_mp_rank_02_optim_states.pt. +27: [2023-04-29 11:26:52,059] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 222 +47: [2023-04-29 11:26:52,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. + 1: [2023-04-29 11:26:52,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt. + 4: [2023-04-29 11:26:52,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 4: [2023-04-29 11:26:52,059] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 1: [2023-04-29 11:26:52,060] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 10 + 4: [2023-04-29 11:26:52,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 4: [2023-04-29 11:26:52,060] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +45: [2023-04-29 11:26:52,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +48: [2023-04-29 11:26:52,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +37: [2023-04-29 11:26:52,059] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 300 +45: [2023-04-29 11:26:52,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... + 0: [2023-04-29 11:26:52,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 0: [2023-04-29 11:26:52,063] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +48: [2023-04-29 11:26:52,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 3: [2023-04-29 11:26:52,065] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 28 +48: [2023-04-29 11:26:52,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +48: [2023-04-29 11:26:52,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +40: [2023-04-29 11:26:52,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +40: [2023-04-29 11:26:52,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 7: [2023-04-29 11:26:52,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +40: [2023-04-29 11:26:52,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 7: [2023-04-29 11:26:52,066] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +52: [2023-04-29 11:26:52,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +52: [2023-04-29 11:26:52,066] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +28: [2023-04-29 11:26:52,067] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 228 + 7: [2023-04-29 11:26:52,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +56: [2023-04-29 11:26:52,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 7: [2023-04-29 11:26:52,067] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +27: [2023-04-29 11:26:52,068] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 222 + 1: [2023-04-29 11:26:52,068] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 10 +37: [2023-04-29 11:26:52,068] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 300 +57: [2023-04-29 11:26:52,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_100_mp_rank_02_optim_states.pt. +57: [2023-04-29 11:26:52,068] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 456 +53: [2023-04-29 11:26:52,068] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_86_mp_rank_02_optim_states.pt. +53: [2023-04-29 11:26:52,069] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 428 +45: [2023-04-29 11:26:52,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... + 2: [2023-04-29 11:26:52,069] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +18: [2023-04-29 11:26:52,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +18: [2023-04-29 11:26:52,069] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +18: [2023-04-29 11:26:52,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +18: [2023-04-29 11:26:52,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 2: [2023-04-29 11:26:52,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +56: [2023-04-29 11:26:52,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +56: [2023-04-29 11:26:52,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 11:26:52,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +52: [2023-04-29 11:26:52,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 5: [2023-04-29 11:26:52,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 5: [2023-04-29 11:26:52,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 5: [2023-04-29 11:26:52,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +48: [2023-04-29 11:26:52,070] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... + 5: [2023-04-29 11:26:52,070] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +46: [2023-04-29 11:26:52,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_59_mp_rank_03_optim_states.pt... +46: [2023-04-29 11:26:52,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_56_mp_rank_03_optim_states.pt... +46: [2023-04-29 11:26:52,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_58_mp_rank_03_optim_states.pt... +46: [2023-04-29 11:26:52,071] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_57_mp_rank_03_optim_states.pt... +40: [2023-04-29 11:26:52,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 11:26:52,071] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +48: [2023-04-29 11:26:52,072] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... + 0: [2023-04-29 11:26:52,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +59: [2023-04-29 11:26:52,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_111_mp_rank_02_optim_states.pt. +59: [2023-04-29 11:26:52,072] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 478 +24: [2023-04-29 11:26:52,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +40: [2023-04-29 11:26:52,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +40: [2023-04-29 11:26:52,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +40: [2023-04-29 11:26:52,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +52: [2023-04-29 11:26:52,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_83_mp_rank_02_optim_states.pt. + 2: [2023-04-29 11:26:52,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +52: [2023-04-29 11:26:52,073] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 422 +56: [2023-04-29 11:26:52,074] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +30: [2023-04-29 11:26:52,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +30: [2023-04-29 11:26:52,073] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 2: [2023-04-29 11:26:52,073] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +44: [2023-04-29 11:26:52,075] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +57: [2023-04-29 11:26:52,075] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 456 + 0: [2023-04-29 11:26:52,075] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +46: [2023-04-29 11:26:52,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_56_mp_rank_02_optim_states.pt. +50: [2023-04-29 11:26:52,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +46: [2023-04-29 11:26:52,076] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 368 +50: [2023-04-29 11:26:52,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +30: [2023-04-29 11:26:52,076] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +50: [2023-04-29 11:26:52,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +50: [2023-04-29 11:26:52,076] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +40: [2023-04-29 11:26:52,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +53: [2023-04-29 11:26:52,077] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 428 +44: [2023-04-29 11:26:52,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +30: [2023-04-29 11:26:52,077] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +56: [2023-04-29 11:26:52,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +24: [2023-04-29 11:26:52,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +56: [2023-04-29 11:26:52,077] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +27: [2023-04-29 11:26:52,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +27: [2023-04-29 11:26:52,078] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +22: [2023-04-29 11:26:52,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +16: [2023-04-29 11:26:52,079] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +16: [2023-04-29 11:26:52,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. + 0: [2023-04-29 11:26:52,080] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +42: [2023-04-29 11:26:52,080] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_43_mp_rank_02_optim_states.pt. +42: [2023-04-29 11:26:52,080] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 342 +52: [2023-04-29 11:26:52,080] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 422 +47: [2023-04-29 11:26:52,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +44: [2023-04-29 11:26:52,081] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +59: [2023-04-29 11:26:52,081] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 478 +47: [2023-04-29 11:26:52,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 0: [2023-04-29 11:26:52,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +16: [2023-04-29 11:26:52,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +44: [2023-04-29 11:26:52,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 11:26:52,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +27: [2023-04-29 11:26:52,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +27: [2023-04-29 11:26:52,082] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +22: [2023-04-29 11:26:52,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +27: [2023-04-29 11:26:52,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +26: [2023-04-29 11:26:52,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +16: [2023-04-29 11:26:52,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_21-model_01-model_states.pt. +52: [2023-04-29 11:26:52,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_80_mp_rank_02_optim_states.pt. +61: [2023-04-29 11:26:52,084] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 11:26:52,085] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 416 +46: [2023-04-29 11:26:52,085] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 368 +27: [2023-04-29 11:26:52,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +47: [2023-04-29 11:26:52,087] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +26: [2023-04-29 11:26:52,088] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +42: [2023-04-29 11:26:52,088] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 342 +27: [2023-04-29 11:26:52,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +34: [2023-04-29 11:26:52,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_9_mp_rank_02_optim_states.pt. +44: [2023-04-29 11:26:52,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +26: [2023-04-29 11:26:52,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +34: [2023-04-29 11:26:52,089] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 274 +44: [2023-04-29 11:26:52,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +61: [2023-04-29 11:26:52,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +22: [2023-04-29 11:26:52,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +22: [2023-04-29 11:26:52,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +48: [2023-04-29 11:26:52,089] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_66_mp_rank_02_optim_states.pt. +26: [2023-04-29 11:26:52,089] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +48: [2023-04-29 11:26:52,089] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 388 +61: [2023-04-29 11:26:52,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +61: [2023-04-29 11:26:52,090] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +24: [2023-04-29 11:26:52,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +24: [2023-04-29 11:26:52,090] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +29: [2023-04-29 11:26:52,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +47: [2023-04-29 11:26:52,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... + 7: [2023-04-29 11:26:52,091] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +24: [2023-04-29 11:26:52,091] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 7: [2023-04-29 11:26:52,092] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +46: [2023-04-29 11:26:52,093] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_59_mp_rank_02_optim_states.pt. +52: [2023-04-29 11:26:52,093] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 416 +46: [2023-04-29 11:26:52,093] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 374 +26: [2023-04-29 11:26:52,093] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +61: [2023-04-29 11:26:52,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +27: [2023-04-29 11:26:52,094] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +25: [2023-04-29 11:26:52,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +25: [2023-04-29 11:26:52,094] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +26: [2023-04-29 11:26:52,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +57: [2023-04-29 11:26:52,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +11: [2023-04-29 11:26:52,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +22: [2023-04-29 11:26:52,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +61: [2023-04-29 11:26:52,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 7: [2023-04-29 11:26:52,095] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +44: [2023-04-29 11:26:52,095] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_51_mp_rank_02_optim_states.pt. +61: [2023-04-29 11:26:52,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +44: [2023-04-29 11:26:52,096] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 358 + 6: [2023-04-29 11:26:52,096] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +29: [2023-04-29 11:26:52,096] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +28: [2023-04-29 11:26:52,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt. +28: [2023-04-29 11:26:52,097] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 224 +22: [2023-04-29 11:26:52,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +18: [2023-04-29 11:26:52,097] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +25: [2023-04-29 11:26:52,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +21: [2023-04-29 11:26:52,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +48: [2023-04-29 11:26:52,097] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 388 +25: [2023-04-29 11:26:52,097] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +24: [2023-04-29 11:26:52,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +24: [2023-04-29 11:26:52,098] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +29: [2023-04-29 11:26:52,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +26: [2023-04-29 11:26:52,098] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +24: [2023-04-29 11:26:52,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... + 5: [2023-04-29 11:26:52,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +18: [2023-04-29 11:26:52,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +11: [2023-04-29 11:26:52,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 7: [2023-04-29 11:26:52,099] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +18: [2023-04-29 11:26:52,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +57: [2023-04-29 11:26:52,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... + 5: [2023-04-29 11:26:52,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +34: [2023-04-29 11:26:52,100] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 274 +61: [2023-04-29 11:26:52,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +18: [2023-04-29 11:26:52,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +30: [2023-04-29 11:26:52,100] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 5: [2023-04-29 11:26:52,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 5: [2023-04-29 11:26:52,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 6: [2023-04-29 11:26:52,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +30: [2023-04-29 11:26:52,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +30: [2023-04-29 11:26:52,101] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +53: [2023-04-29 11:26:52,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +53: [2023-04-29 11:26:52,101] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +22: [2023-04-29 11:26:52,102] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +29: [2023-04-29 11:26:52,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +46: [2023-04-29 11:26:52,103] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 374 +44: [2023-04-29 11:26:52,103] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 358 +21: [2023-04-29 11:26:52,103] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +28: [2023-04-29 11:26:52,105] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 224 +30: [2023-04-29 11:26:52,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +26: [2023-04-29 11:26:52,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +22: [2023-04-29 11:26:52,106] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +57: [2023-04-29 11:26:52,106] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 6: [2023-04-29 11:26:52,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +21: [2023-04-29 11:26:52,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +29: [2023-04-29 11:26:52,107] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +21: [2023-04-29 11:26:52,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +48: [2023-04-29 11:26:52,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_64_mp_rank_02_optim_states.pt. +48: [2023-04-29 11:26:52,110] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 384 +57: [2023-04-29 11:26:52,110] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +53: [2023-04-29 11:26:52,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +53: [2023-04-29 11:26:52,110] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +53: [2023-04-29 11:26:52,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +58: [2023-04-29 11:26:52,111] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_104_mp_rank_02_optim_states.pt. +58: [2023-04-29 11:26:52,111] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 464 +57: [2023-04-29 11:26:52,112] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... + 6: [2023-04-29 11:26:52,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +57: [2023-04-29 11:26:52,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +21: [2023-04-29 11:26:52,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +16: [2023-04-29 11:26:52,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +16: [2023-04-29 11:26:52,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +29: [2023-04-29 11:26:52,113] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +13: [2023-04-29 11:26:52,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +13: [2023-04-29 11:26:52,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 6: [2023-04-29 11:26:52,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 6: [2023-04-29 11:26:52,113] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +21: [2023-04-29 11:26:52,114] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +53: [2023-04-29 11:26:52,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +11: [2023-04-29 11:26:52,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +11: [2023-04-29 11:26:52,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +11: [2023-04-29 11:26:52,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +37: [2023-04-29 11:26:52,115] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_23_mp_rank_02_optim_states.pt. +57: [2023-04-29 11:26:52,115] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +37: [2023-04-29 11:26:52,115] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 302 +29: [2023-04-29 11:26:52,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +57: [2023-04-29 11:26:52,116] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_102_mp_rank_02_optim_states.pt. +57: [2023-04-29 11:26:52,116] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 460 +13: [2023-04-29 11:26:52,117] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +21: [2023-04-29 11:26:52,117] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +53: [2023-04-29 11:26:52,118] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +48: [2023-04-29 11:26:52,118] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 384 +57: [2023-04-29 11:26:52,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... + 6: [2023-04-29 11:26:52,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +16: [2023-04-29 11:26:52,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... + 6: [2023-04-29 11:26:52,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +21: [2023-04-29 11:26:52,119] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +58: [2023-04-29 11:26:52,120] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 464 +43: [2023-04-29 11:26:52,120] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_44_mp_rank_03_optim_states.pt. +43: [2023-04-29 11:26:52,120] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 345 +23: [2023-04-29 11:26:52,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +23: [2023-04-29 11:26:52,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +23: [2023-04-29 11:26:52,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +53: [2023-04-29 11:26:52,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +23: [2023-04-29 11:26:52,121] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +25: [2023-04-29 11:26:52,121] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +16: [2023-04-29 11:26:52,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt... +13: [2023-04-29 11:26:52,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +13: [2023-04-29 11:26:52,122] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +29: [2023-04-29 11:26:52,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +13: [2023-04-29 11:26:52,123] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +57: [2023-04-29 11:26:52,123] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 460 +13: [2023-04-29 11:26:52,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +11: [2023-04-29 11:26:52,123] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +11: [2023-04-29 11:26:52,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +37: [2023-04-29 11:26:52,124] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 302 +11: [2023-04-29 11:26:52,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +25: [2023-04-29 11:26:52,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +25: [2023-04-29 11:26:52,124] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +25: [2023-04-29 11:26:52,127] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +42: [2023-04-29 11:26:52,128] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_40_mp_rank_02_optim_states.pt. +42: [2023-04-29 11:26:52,128] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 336 +13: [2023-04-29 11:26:52,128] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... + 1: [2023-04-29 11:26:52,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt. + 1: [2023-04-29 11:26:52,130] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 14 +57: [2023-04-29 11:26:52,129] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_101_mp_rank_02_optim_states.pt. +57: [2023-04-29 11:26:52,130] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 458 +41: [2023-04-29 11:26:52,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_38_mp_rank_02_optim_states.pt. +50: [2023-04-29 11:26:52,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_74_mp_rank_02_optim_states.pt. +41: [2023-04-29 11:26:52,133] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 332 +50: [2023-04-29 11:26:52,133] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 404 + 2: [2023-04-29 11:26:52,133] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +52: [2023-04-29 11:26:52,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 11:26:52,134] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +42: [2023-04-29 11:26:52,135] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_41_mp_rank_02_optim_states.pt. +42: [2023-04-29 11:26:52,135] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 338 +42: [2023-04-29 11:26:52,137] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 336 +61: [2023-04-29 11:26:52,137] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_116_mp_rank_02_optim_states.pt. +61: [2023-04-29 11:26:52,137] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 488 + 1: [2023-04-29 11:26:52,137] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 14 +57: [2023-04-29 11:26:52,137] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 458 +55: [2023-04-29 11:26:52,138] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_92_mp_rank_02_optim_states.pt. + 2: [2023-04-29 11:26:52,138] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +55: [2023-04-29 11:26:52,139] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 440 +41: [2023-04-29 11:26:52,139] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 332 +50: [2023-04-29 11:26:52,140] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 404 +52: [2023-04-29 11:26:52,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +52: [2023-04-29 11:26:52,141] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +52: [2023-04-29 11:26:52,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +55: [2023-04-29 11:26:52,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_95_mp_rank_02_optim_states.pt. +55: [2023-04-29 11:26:52,142] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 446 +50: [2023-04-29 11:26:52,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +50: [2023-04-29 11:26:52,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +42: [2023-04-29 11:26:52,142] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 338 +52: [2023-04-29 11:26:52,142] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 1: [2023-04-29 11:26:52,144] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt. + 1: [2023-04-29 11:26:52,144] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 8 + 2: [2023-04-29 11:26:52,145] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +55: [2023-04-29 11:26:52,146] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 440 +23: [2023-04-29 11:26:52,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +23: [2023-04-29 11:26:52,145] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 0: [2023-04-29 11:26:52,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt. +61: [2023-04-29 11:26:52,146] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 488 +44: [2023-04-29 11:26:52,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_49_mp_rank_02_optim_states.pt. + 0: [2023-04-29 11:26:52,146] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 2 +50: [2023-04-29 11:26:52,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +50: [2023-04-29 11:26:52,146] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +44: [2023-04-29 11:26:52,146] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 354 +47: [2023-04-29 11:26:52,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +52: [2023-04-29 11:26:52,147] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... + 2: [2023-04-29 11:26:52,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 2: [2023-04-29 11:26:52,147] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +52: [2023-04-29 11:26:52,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +53: [2023-04-29 11:26:52,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_84_mp_rank_02_optim_states.pt. +33: [2023-04-29 11:26:52,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_4_mp_rank_03_optim_states.pt. +53: [2023-04-29 11:26:52,148] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 424 +18: [2023-04-29 11:26:52,148] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt. +50: [2023-04-29 11:26:52,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +50: [2023-04-29 11:26:52,148] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +55: [2023-04-29 11:26:52,149] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 446 +18: [2023-04-29 11:26:52,148] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 146 +33: [2023-04-29 11:26:52,148] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 265 +23: [2023-04-29 11:26:52,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +23: [2023-04-29 11:26:52,149] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +47: [2023-04-29 11:26:52,149] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +37: [2023-04-29 11:26:52,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_20_mp_rank_02_optim_states.pt. +37: [2023-04-29 11:26:52,150] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 296 +35: [2023-04-29 11:26:52,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +35: [2023-04-29 11:26:52,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +47: [2023-04-29 11:26:52,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_60_mp_rank_02_optim_states.pt. +47: [2023-04-29 11:26:52,151] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 376 +35: [2023-04-29 11:26:52,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. + 2: [2023-04-29 11:26:52,152] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +35: [2023-04-29 11:26:52,151] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. + 1: [2023-04-29 11:26:52,151] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 8 +61: [2023-04-29 11:26:52,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_118_mp_rank_02_optim_states.pt. +61: [2023-04-29 11:26:52,153] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 492 +50: [2023-04-29 11:26:52,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +30: [2023-04-29 11:26:52,153] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 2: [2023-04-29 11:26:52,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +50: [2023-04-29 11:26:52,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... + 2: [2023-04-29 11:26:52,153] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +44: [2023-04-29 11:26:52,154] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 354 +47: [2023-04-29 11:26:52,155] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 0: [2023-04-29 11:26:52,155] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 2 +42: [2023-04-29 11:26:52,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +42: [2023-04-29 11:26:52,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +42: [2023-04-29 11:26:52,156] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +42: [2023-04-29 11:26:52,157] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_43-model_01-model_states.pt. +47: [2023-04-29 11:26:52,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +18: [2023-04-29 11:26:52,157] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 146 +53: [2023-04-29 11:26:52,157] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 424 +47: [2023-04-29 11:26:52,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +30: [2023-04-29 11:26:52,157] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 7: [2023-04-29 11:26:52,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +59: [2023-04-29 11:26:52,158] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_108_mp_rank_02_optim_states.pt. +47: [2023-04-29 11:26:52,158] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 376 +59: [2023-04-29 11:26:52,158] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 472 +37: [2023-04-29 11:26:52,159] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 296 + 7: [2023-04-29 11:26:52,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +47: [2023-04-29 11:26:52,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +47: [2023-04-29 11:26:52,160] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +47: [2023-04-29 11:26:52,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_62_mp_rank_02_optim_states.pt. +47: [2023-04-29 11:26:52,161] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 380 +41: [2023-04-29 11:26:52,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_37_mp_rank_02_optim_states.pt. +61: [2023-04-29 11:26:52,161] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 492 +41: [2023-04-29 11:26:52,161] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 330 +53: [2023-04-29 11:26:52,161] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_85_mp_rank_02_optim_states.pt. +53: [2023-04-29 11:26:52,162] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 426 + 7: [2023-04-29 11:26:52,162] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 7: [2023-04-29 11:26:52,163] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... + 7: [2023-04-29 11:26:52,164] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +36: [2023-04-29 11:26:52,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_16_mp_rank_02_optim_states.pt. +33: [2023-04-29 11:26:52,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_5_mp_rank_03_optim_states.pt. +36: [2023-04-29 11:26:52,164] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 288 +33: [2023-04-29 11:26:52,164] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 267 + 7: [2023-04-29 11:26:52,164] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 8: [2023-04-29 11:26:52,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 8: [2023-04-29 11:26:52,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 8: [2023-04-29 11:26:52,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 8: [2023-04-29 11:26:52,165] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +18: [2023-04-29 11:26:52,166] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 7: [2023-04-29 11:26:52,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +59: [2023-04-29 11:26:52,167] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 472 +47: [2023-04-29 11:26:52,167] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +28: [2023-04-29 11:26:52,168] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt. +28: [2023-04-29 11:26:52,168] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 230 +41: [2023-04-29 11:26:52,168] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 330 + 5: [2023-04-29 11:26:52,169] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +47: [2023-04-29 11:26:52,169] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 380 +30: [2023-04-29 11:26:52,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +30: [2023-04-29 11:26:52,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +18: [2023-04-29 11:26:52,170] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 7: [2023-04-29 11:26:52,170] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +53: [2023-04-29 11:26:52,171] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 426 +36: [2023-04-29 11:26:52,171] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 288 + 9: [2023-04-29 11:26:52,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 9: [2023-04-29 11:26:52,171] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +18: [2023-04-29 11:26:52,172] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +59: [2023-04-29 11:26:52,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_109_mp_rank_02_optim_states.pt. +59: [2023-04-29 11:26:52,172] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 474 + 5: [2023-04-29 11:26:52,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 5: [2023-04-29 11:26:52,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +30: [2023-04-29 11:26:52,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +18: [2023-04-29 11:26:52,173] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 9: [2023-04-29 11:26:52,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +55: [2023-04-29 11:26:52,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +55: [2023-04-29 11:26:52,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. + 9: [2023-04-29 11:26:52,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +28: [2023-04-29 11:26:52,175] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 230 + 5: [2023-04-29 11:26:52,175] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +30: [2023-04-29 11:26:52,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 5: [2023-04-29 11:26:52,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +18: [2023-04-29 11:26:52,176] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +30: [2023-04-29 11:26:52,176] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +55: [2023-04-29 11:26:52,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +55: [2023-04-29 11:26:52,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +18: [2023-04-29 11:26:52,177] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +41: [2023-04-29 11:26:52,177] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_36_mp_rank_02_optim_states.pt. +41: [2023-04-29 11:26:52,177] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 328 + 5: [2023-04-29 11:26:52,178] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +46: [2023-04-29 11:26:52,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_57_mp_rank_02_optim_states.pt. +25: [2023-04-29 11:26:52,178] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +46: [2023-04-29 11:26:52,178] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 370 + 5: [2023-04-29 11:26:52,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +30: [2023-04-29 11:26:52,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +18: [2023-04-29 11:26:52,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +35: [2023-04-29 11:26:52,179] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +59: [2023-04-29 11:26:52,180] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 474 +50: [2023-04-29 11:26:52,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_73_mp_rank_02_optim_states.pt. +50: [2023-04-29 11:26:52,181] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 402 + 5: [2023-04-29 11:26:52,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +25: [2023-04-29 11:26:52,182] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +35: [2023-04-29 11:26:52,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +35: [2023-04-29 11:26:52,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +35: [2023-04-29 11:26:52,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +18: [2023-04-29 11:26:52,183] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +16: [2023-04-29 11:26:52,184] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +41: [2023-04-29 11:26:52,185] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 328 +42: [2023-04-29 11:26:52,185] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +16: [2023-04-29 11:26:52,186] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +46: [2023-04-29 11:26:52,186] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 370 +16: [2023-04-29 11:26:52,189] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. +42: [2023-04-29 11:26:52,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +50: [2023-04-29 11:26:52,189] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 402 +42: [2023-04-29 11:26:52,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +42: [2023-04-29 11:26:52,189] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt... +39: [2023-04-29 11:26:52,191] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_31_mp_rank_03_optim_states.pt. +39: [2023-04-29 11:26:52,191] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 319 +16: [2023-04-29 11:26:52,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +16: [2023-04-29 11:26:52,191] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +55: [2023-04-29 11:26:52,193] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_94_mp_rank_02_optim_states.pt. +55: [2023-04-29 11:26:52,193] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 444 +20: [2023-04-29 11:26:52,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +20: [2023-04-29 11:26:52,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +20: [2023-04-29 11:26:52,194] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +20: [2023-04-29 11:26:52,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +25: [2023-04-29 11:26:52,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +25: [2023-04-29 11:26:52,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +16: [2023-04-29 11:26:52,195] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +44: [2023-04-29 11:26:52,195] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_48_mp_rank_02_optim_states.pt. +44: [2023-04-29 11:26:52,195] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 352 + 8: [2023-04-29 11:26:52,197] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +25: [2023-04-29 11:26:52,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 8: [2023-04-29 11:26:52,199] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +27: [2023-04-29 11:26:52,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt. +27: [2023-04-29 11:26:52,200] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 220 +62: [2023-04-29 11:26:52,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_120_mp_rank_03_optim_states.pt. +62: [2023-04-29 11:26:52,200] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 497 +16: [2023-04-29 11:26:52,200] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_00-model_states.pt. + 8: [2023-04-29 11:26:52,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 8: [2023-04-29 11:26:52,200] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +13: [2023-04-29 11:26:52,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt. +13: [2023-04-29 11:26:52,201] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 110 +57: [2023-04-29 11:26:52,201] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_103_mp_rank_02_optim_states.pt. +57: [2023-04-29 11:26:52,202] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 462 +25: [2023-04-29 11:26:52,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +55: [2023-04-29 11:26:52,202] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 444 +25: [2023-04-29 11:26:52,202] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +44: [2023-04-29 11:26:52,203] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 352 + 9: [2023-04-29 11:26:52,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +55: [2023-04-29 11:26:52,203] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +55: [2023-04-29 11:26:52,203] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +49: [2023-04-29 11:26:52,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_70_mp_rank_02_optim_states.pt. +49: [2023-04-29 11:26:52,204] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 396 +25: [2023-04-29 11:26:52,205] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt. +25: [2023-04-29 11:26:52,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +25: [2023-04-29 11:26:52,205] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 206 +55: [2023-04-29 11:26:52,205] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... + 9: [2023-04-29 11:26:52,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 9: [2023-04-29 11:26:52,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 9: [2023-04-29 11:26:52,206] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +16: [2023-04-29 11:26:52,207] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt... +18: [2023-04-29 11:26:52,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt. +18: [2023-04-29 11:26:52,208] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 150 +27: [2023-04-29 11:26:52,208] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 220 +41: [2023-04-29 11:26:52,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +41: [2023-04-29 11:26:52,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +41: [2023-04-29 11:26:52,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +41: [2023-04-29 11:26:52,208] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +13: [2023-04-29 11:26:52,208] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 110 +57: [2023-04-29 11:26:52,209] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 462 +55: [2023-04-29 11:26:52,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +23: [2023-04-29 11:26:52,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +23: [2023-04-29 11:26:52,210] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +55: [2023-04-29 11:26:52,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +55: [2023-04-29 11:26:52,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +55: [2023-04-29 11:26:52,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +55: [2023-04-29 11:26:52,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +55: [2023-04-29 11:26:52,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +55: [2023-04-29 11:26:52,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +55: [2023-04-29 11:26:52,211] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +55: [2023-04-29 11:26:52,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +55: [2023-04-29 11:26:52,211] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +55: [2023-04-29 11:26:52,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +55: [2023-04-29 11:26:52,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +55: [2023-04-29 11:26:52,212] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +25: [2023-04-29 11:26:52,212] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 206 +49: [2023-04-29 11:26:52,212] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 396 +23: [2023-04-29 11:26:52,215] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +18: [2023-04-29 11:26:52,216] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 150 +23: [2023-04-29 11:26:52,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +23: [2023-04-29 11:26:52,216] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +23: [2023-04-29 11:26:52,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +53: [2023-04-29 11:26:52,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_87_mp_rank_02_optim_states.pt. +53: [2023-04-29 11:26:52,220] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 430 +50: [2023-04-29 11:26:52,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_72_mp_rank_02_optim_states.pt. +50: [2023-04-29 11:26:52,221] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 400 +23: [2023-04-29 11:26:52,221] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +23: [2023-04-29 11:26:52,224] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +25: [2023-04-29 11:26:52,225] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt. +25: [2023-04-29 11:26:52,225] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 200 +20: [2023-04-29 11:26:52,225] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +53: [2023-04-29 11:26:52,228] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 430 +20: [2023-04-29 11:26:52,228] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +20: [2023-04-29 11:26:52,229] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +50: [2023-04-29 11:26:52,229] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 400 +32: [2023-04-29 11:26:52,231] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_0_mp_rank_02_optim_states.pt. +32: [2023-04-29 11:26:52,231] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 256 +20: [2023-04-29 11:26:52,232] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +25: [2023-04-29 11:26:52,233] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 200 +41: [2023-04-29 11:26:52,234] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +42: [2023-04-29 11:26:52,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_42_mp_rank_02_optim_states.pt. +41: [2023-04-29 11:26:52,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +37: [2023-04-29 11:26:52,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +37: [2023-04-29 11:26:52,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +37: [2023-04-29 11:26:52,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +42: [2023-04-29 11:26:52,235] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 340 +37: [2023-04-29 11:26:52,235] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +35: [2023-04-29 11:26:52,236] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +41: [2023-04-29 11:26:52,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 11:26:52,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +41: [2023-04-29 11:26:52,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +41: [2023-04-29 11:26:52,237] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +43: [2023-04-29 11:26:52,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_45_mp_rank_03_optim_states.pt. +50: [2023-04-29 11:26:52,237] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_75_mp_rank_02_optim_states.pt. +50: [2023-04-29 11:26:52,238] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 406 +43: [2023-04-29 11:26:52,238] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 347 +32: [2023-04-29 11:26:52,239] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 256 +41: [2023-04-29 11:26:52,240] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 11:26:52,240] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +41: [2023-04-29 11:26:52,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +41: [2023-04-29 11:26:52,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +41: [2023-04-29 11:26:52,241] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +41: [2023-04-29 11:26:52,241] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +41: [2023-04-29 11:26:52,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +41: [2023-04-29 11:26:52,242] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +41: [2023-04-29 11:26:52,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +41: [2023-04-29 11:26:52,242] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +38: [2023-04-29 11:26:52,243] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_24_mp_rank_03_optim_states.pt. +38: [2023-04-29 11:26:52,244] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 305 +42: [2023-04-29 11:26:52,245] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 340 +33: [2023-04-29 11:26:52,246] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_6_mp_rank_03_optim_states.pt. +33: [2023-04-29 11:26:52,246] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 269 +50: [2023-04-29 11:26:52,247] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 406 +35: [2023-04-29 11:26:52,249] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +42: [2023-04-29 11:26:52,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +42: [2023-04-29 11:26:52,250] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +55: [2023-04-29 11:26:52,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_95_mp_rank_03_optim_states.pt... +55: [2023-04-29 11:26:52,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_93_mp_rank_03_optim_states.pt... +55: [2023-04-29 11:26:52,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_92_mp_rank_03_optim_states.pt... +55: [2023-04-29 11:26:52,253] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_94_mp_rank_03_optim_states.pt... +42: [2023-04-29 11:26:52,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +42: [2023-04-29 11:26:52,255] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +63: [2023-04-29 11:26:52,256] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_127_mp_rank_03_optim_states.pt. +63: [2023-04-29 11:26:52,256] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 511 +42: [2023-04-29 11:26:52,257] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. + 9: [2023-04-29 11:26:52,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +35: [2023-04-29 11:26:52,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +35: [2023-04-29 11:26:52,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +35: [2023-04-29 11:26:52,259] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +43: [2023-04-29 11:26:52,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_47_mp_rank_03_optim_states.pt. +43: [2023-04-29 11:26:52,261] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 351 +42: [2023-04-29 11:26:52,262] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_00-model_states.pt. +42: [2023-04-29 11:26:52,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... + 9: [2023-04-29 11:26:52,262] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +31: [2023-04-29 11:26:52,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +31: [2023-04-29 11:26:52,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +31: [2023-04-29 11:26:52,263] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +37: [2023-04-29 11:26:52,264] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +31: [2023-04-29 11:26:52,264] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +37: [2023-04-29 11:26:52,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +34: [2023-04-29 11:26:52,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +34: [2023-04-29 11:26:52,265] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +37: [2023-04-29 11:26:52,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +35: [2023-04-29 11:26:52,266] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... + 8: [2023-04-29 11:26:52,266] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +34: [2023-04-29 11:26:52,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +35: [2023-04-29 11:26:52,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +30: [2023-04-29 11:26:52,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt. +30: [2023-04-29 11:26:52,267] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 244 +34: [2023-04-29 11:26:52,267] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +35: [2023-04-29 11:26:52,267] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... + 8: [2023-04-29 11:26:52,268] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +42: [2023-04-29 11:26:52,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt... +37: [2023-04-29 11:26:52,268] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +37: [2023-04-29 11:26:52,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +37: [2023-04-29 11:26:52,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +37: [2023-04-29 11:26:52,269] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +37: [2023-04-29 11:26:52,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +37: [2023-04-29 11:26:52,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +37: [2023-04-29 11:26:52,269] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +51: [2023-04-29 11:26:52,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_77_mp_rank_03_optim_states.pt. +37: [2023-04-29 11:26:52,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +37: [2023-04-29 11:26:52,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +51: [2023-04-29 11:26:52,270] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 411 +37: [2023-04-29 11:26:52,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +37: [2023-04-29 11:26:52,270] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +37: [2023-04-29 11:26:52,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +13: [2023-04-29 11:26:52,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt. +37: [2023-04-29 11:26:52,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +13: [2023-04-29 11:26:52,271] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 106 + 9: [2023-04-29 11:26:52,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 8: [2023-04-29 11:26:52,273] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 8: [2023-04-29 11:26:52,274] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +30: [2023-04-29 11:26:52,274] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 244 +22: [2023-04-29 11:26:52,274] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt. +22: [2023-04-29 11:26:52,275] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 178 + 8: [2023-04-29 11:26:52,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +35: [2023-04-29 11:26:52,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_13_mp_rank_02_optim_states.pt. +35: [2023-04-29 11:26:52,276] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 282 + 9: [2023-04-29 11:26:52,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +29: [2023-04-29 11:26:52,276] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt. +29: [2023-04-29 11:26:52,276] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 232 + 9: [2023-04-29 11:26:52,277] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 9: [2023-04-29 11:26:52,278] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 11:26:52,279] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 106 + 8: [2023-04-29 11:26:52,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +20: [2023-04-29 11:26:52,279] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +28: [2023-04-29 11:26:52,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +28: [2023-04-29 11:26:52,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 8: [2023-04-29 11:26:52,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +22: [2023-04-29 11:26:52,282] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 178 + 9: [2023-04-29 11:26:52,282] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +29: [2023-04-29 11:26:52,283] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 232 +22: [2023-04-29 11:26:52,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt. +22: [2023-04-29 11:26:52,284] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 182 + 9: [2023-04-29 11:26:52,284] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +28: [2023-04-29 11:26:52,284] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +20: [2023-04-29 11:26:52,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +28: [2023-04-29 11:26:52,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +35: [2023-04-29 11:26:52,285] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 282 +13: [2023-04-29 11:26:52,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt. + 8: [2023-04-29 11:26:52,285] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +13: [2023-04-29 11:26:52,285] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 104 +41: [2023-04-29 11:26:52,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_36_mp_rank_03_optim_states.pt... +41: [2023-04-29 11:26:52,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_39_mp_rank_03_optim_states.pt... +41: [2023-04-29 11:26:52,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_38_mp_rank_03_optim_states.pt... +41: [2023-04-29 11:26:52,287] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_37_mp_rank_03_optim_states.pt... +60: [2023-04-29 11:26:52,288] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_114_mp_rank_03_optim_states.pt. +60: [2023-04-29 11:26:52,288] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 485 +30: [2023-04-29 11:26:52,289] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt. +30: [2023-04-29 11:26:52,290] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 246 +31: [2023-04-29 11:26:52,290] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +22: [2023-04-29 11:26:52,291] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 182 +31: [2023-04-29 11:26:52,291] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +34: [2023-04-29 11:26:52,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +31: [2023-04-29 11:26:52,293] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +13: [2023-04-29 11:26:52,293] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 104 +34: [2023-04-29 11:26:52,293] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +20: [2023-04-29 11:26:52,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +34: [2023-04-29 11:26:52,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +34: [2023-04-29 11:26:52,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +31: [2023-04-29 11:26:52,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +34: [2023-04-29 11:26:52,294] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +34: [2023-04-29 11:26:52,294] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +30: [2023-04-29 11:26:52,296] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 246 +34: [2023-04-29 11:26:52,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +34: [2023-04-29 11:26:52,297] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +20: [2023-04-29 11:26:52,299] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +62: [2023-04-29 11:26:52,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_122_mp_rank_03_optim_states.pt. +62: [2023-04-29 11:26:52,301] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 501 +34: [2023-04-29 11:26:52,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +20: [2023-04-29 11:26:52,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +34: [2023-04-29 11:26:52,301] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +34: [2023-04-29 11:26:52,301] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +34: [2023-04-29 11:26:52,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +34: [2023-04-29 11:26:52,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +34: [2023-04-29 11:26:52,302] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +34: [2023-04-29 11:26:52,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +34: [2023-04-29 11:26:52,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +54: [2023-04-29 11:26:52,302] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_91_mp_rank_03_optim_states.pt. +54: [2023-04-29 11:26:52,302] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 439 +20: [2023-04-29 11:26:52,304] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +35: [2023-04-29 11:26:52,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt. +35: [2023-04-29 11:26:52,307] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 280 +20: [2023-04-29 11:26:52,309] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +32: [2023-04-29 11:26:52,309] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_3_mp_rank_02_optim_states.pt. +32: [2023-04-29 11:26:52,310] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 262 +20: [2023-04-29 11:26:52,311] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +28: [2023-04-29 11:26:52,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +28: [2023-04-29 11:26:52,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +28: [2023-04-29 11:26:52,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +28: [2023-04-29 11:26:52,313] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +52: [2023-04-29 11:26:52,313] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_81_mp_rank_02_optim_states.pt. +52: [2023-04-29 11:26:52,314] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 418 +18: [2023-04-29 11:26:52,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt. +18: [2023-04-29 11:26:52,314] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 144 +12: [2023-04-29 11:26:52,314] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt. +12: [2023-04-29 11:26:52,314] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 96 +35: [2023-04-29 11:26:52,315] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 280 +49: [2023-04-29 11:26:52,315] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_68_mp_rank_03_optim_states.pt. +49: [2023-04-29 11:26:52,316] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 393 +44: [2023-04-29 11:26:52,316] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_50_mp_rank_02_optim_states.pt. +44: [2023-04-29 11:26:52,316] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 356 +37: [2023-04-29 11:26:52,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_23_mp_rank_03_optim_states.pt... +37: [2023-04-29 11:26:52,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_22_mp_rank_03_optim_states.pt... +37: [2023-04-29 11:26:52,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_21_mp_rank_03_optim_states.pt... +37: [2023-04-29 11:26:52,316] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_20_mp_rank_03_optim_states.pt... +51: [2023-04-29 11:26:52,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_76_mp_rank_03_optim_states.pt. +51: [2023-04-29 11:26:52,318] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 409 +32: [2023-04-29 11:26:52,318] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 262 +29: [2023-04-29 11:26:52,318] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt. +29: [2023-04-29 11:26:52,318] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 234 +52: [2023-04-29 11:26:52,321] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 418 +12: [2023-04-29 11:26:52,321] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 96 +27: [2023-04-29 11:26:52,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +27: [2023-04-29 11:26:52,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +27: [2023-04-29 11:26:52,321] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +18: [2023-04-29 11:26:52,322] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 144 +27: [2023-04-29 11:26:52,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +10: [2023-04-29 11:26:52,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +10: [2023-04-29 11:26:52,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +10: [2023-04-29 11:26:52,322] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +10: [2023-04-29 11:26:52,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +25: [2023-04-29 11:26:52,323] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt. +25: [2023-04-29 11:26:52,323] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 204 +44: [2023-04-29 11:26:52,323] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 356 +39: [2023-04-29 11:26:52,325] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_28_mp_rank_03_optim_states.pt. +29: [2023-04-29 11:26:52,325] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 234 +39: [2023-04-29 11:26:52,325] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 313 +56: [2023-04-29 11:26:52,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +56: [2023-04-29 11:26:52,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +56: [2023-04-29 11:26:52,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +56: [2023-04-29 11:26:52,327] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +24: [2023-04-29 11:26:52,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +24: [2023-04-29 11:26:52,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +24: [2023-04-29 11:26:52,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +24: [2023-04-29 11:26:52,328] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +25: [2023-04-29 11:26:52,331] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 204 +48: [2023-04-29 11:26:52,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +48: [2023-04-29 11:26:52,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +48: [2023-04-29 11:26:52,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +48: [2023-04-29 11:26:52,333] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. + 1: [2023-04-29 11:26:52,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt. +35: [2023-04-29 11:26:52,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_14_mp_rank_02_optim_states.pt. + 1: [2023-04-29 11:26:52,336] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 12 +35: [2023-04-29 11:26:52,337] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 284 +51: [2023-04-29 11:26:52,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_79_mp_rank_03_optim_states.pt. +51: [2023-04-29 11:26:52,338] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 415 +34: [2023-04-29 11:26:52,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt... +34: [2023-04-29 11:26:52,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt... +34: [2023-04-29 11:26:52,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_9_mp_rank_03_optim_states.pt... +34: [2023-04-29 11:26:52,343] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_11_mp_rank_03_optim_states.pt... + 1: [2023-04-29 11:26:52,345] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 12 +29: [2023-04-29 11:26:52,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt. +29: [2023-04-29 11:26:52,345] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 238 +39: [2023-04-29 11:26:52,345] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_30_mp_rank_03_optim_states.pt. +35: [2023-04-29 11:26:52,345] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 284 +39: [2023-04-29 11:26:52,345] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 317 +30: [2023-04-29 11:26:52,347] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt. +30: [2023-04-29 11:26:52,348] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 242 +21: [2023-04-29 11:26:52,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +21: [2023-04-29 11:26:52,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +21: [2023-04-29 11:26:52,348] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +19: [2023-04-29 11:26:52,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +19: [2023-04-29 11:26:52,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +21: [2023-04-29 11:26:52,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +19: [2023-04-29 11:26:52,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +19: [2023-04-29 11:26:52,349] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +12: [2023-04-29 11:26:52,352] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt. +12: [2023-04-29 11:26:52,352] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 98 +29: [2023-04-29 11:26:52,352] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 238 +27: [2023-04-29 11:26:52,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +27: [2023-04-29 11:26:52,353] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +51: [2023-04-29 11:26:52,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_78_mp_rank_03_optim_states.pt. +51: [2023-04-29 11:26:52,354] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 413 +17: [2023-04-29 11:26:52,355] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt. +17: [2023-04-29 11:26:52,355] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 140 +48: [2023-04-29 11:26:52,355] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +48: [2023-04-29 11:26:52,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +31: [2023-04-29 11:26:52,356] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +30: [2023-04-29 11:26:52,356] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 242 +56: [2023-04-29 11:26:52,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +27: [2023-04-29 11:26:52,356] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +56: [2023-04-29 11:26:52,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +27: [2023-04-29 11:26:52,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +56: [2023-04-29 11:26:52,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 11:26:52,357] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 11:26:52,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +24: [2023-04-29 11:26:52,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +56: [2023-04-29 11:26:52,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +56: [2023-04-29 11:26:52,357] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +56: [2023-04-29 11:26:52,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 11:26:52,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +48: [2023-04-29 11:26:52,358] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +29: [2023-04-29 11:26:52,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt. +29: [2023-04-29 11:26:52,358] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 236 +14: [2023-04-29 11:26:52,358] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt. +14: [2023-04-29 11:26:52,358] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 114 +31: [2023-04-29 11:26:52,359] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +56: [2023-04-29 11:26:52,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +12: [2023-04-29 11:26:52,360] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 98 +56: [2023-04-29 11:26:52,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +56: [2023-04-29 11:26:52,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +56: [2023-04-29 11:26:52,360] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +56: [2023-04-29 11:26:52,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +56: [2023-04-29 11:26:52,360] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +56: [2023-04-29 11:26:52,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +44: [2023-04-29 11:26:52,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +24: [2023-04-29 11:26:52,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +44: [2023-04-29 11:26:52,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +48: [2023-04-29 11:26:52,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +48: [2023-04-29 11:26:52,361] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +44: [2023-04-29 11:26:52,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +44: [2023-04-29 11:26:52,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +48: [2023-04-29 11:26:52,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 11:26:52,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +48: [2023-04-29 11:26:52,361] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +48: [2023-04-29 11:26:52,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +48: [2023-04-29 11:26:52,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +17: [2023-04-29 11:26:52,362] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 140 +31: [2023-04-29 11:26:52,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +48: [2023-04-29 11:26:52,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +24: [2023-04-29 11:26:52,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +48: [2023-04-29 11:26:52,362] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +24: [2023-04-29 11:26:52,362] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +38: [2023-04-29 11:26:52,363] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_25_mp_rank_03_optim_states.pt. +38: [2023-04-29 11:26:52,363] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 307 +31: [2023-04-29 11:26:52,365] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +61: [2023-04-29 11:26:52,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +61: [2023-04-29 11:26:52,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +61: [2023-04-29 11:26:52,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +29: [2023-04-29 11:26:52,365] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 236 +17: [2023-04-29 11:26:52,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt. +61: [2023-04-29 11:26:52,365] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +17: [2023-04-29 11:26:52,365] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 142 +48: [2023-04-29 11:26:52,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +45: [2023-04-29 11:26:52,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +45: [2023-04-29 11:26:52,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +45: [2023-04-29 11:26:52,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +48: [2023-04-29 11:26:52,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +14: [2023-04-29 11:26:52,366] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 114 +48: [2023-04-29 11:26:52,366] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +45: [2023-04-29 11:26:52,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +15: [2023-04-29 11:26:52,366] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt. +15: [2023-04-29 11:26:52,366] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 122 +48: [2023-04-29 11:26:52,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +40: [2023-04-29 11:26:52,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +40: [2023-04-29 11:26:52,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +40: [2023-04-29 11:26:52,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +40: [2023-04-29 11:26:52,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +36: [2023-04-29 11:26:52,368] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_17_mp_rank_03_optim_states.pt. +36: [2023-04-29 11:26:52,369] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 291 + 5: [2023-04-29 11:26:52,369] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt. +31: [2023-04-29 11:26:52,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 5: [2023-04-29 11:26:52,370] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 40 +58: [2023-04-29 11:26:52,370] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_107_mp_rank_03_optim_states.pt. +58: [2023-04-29 11:26:52,370] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 471 +54: [2023-04-29 11:26:52,371] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_89_mp_rank_03_optim_states.pt. +54: [2023-04-29 11:26:52,371] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 435 +17: [2023-04-29 11:26:52,372] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 142 +31: [2023-04-29 11:26:52,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +15: [2023-04-29 11:26:52,373] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 122 +57: [2023-04-29 11:26:52,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +57: [2023-04-29 11:26:52,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +57: [2023-04-29 11:26:52,373] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +57: [2023-04-29 11:26:52,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +58: [2023-04-29 11:26:52,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_104_mp_rank_03_optim_states.pt. +58: [2023-04-29 11:26:52,374] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 465 +28: [2023-04-29 11:26:52,374] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +21: [2023-04-29 11:26:52,375] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +62: [2023-04-29 11:26:52,376] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_123_mp_rank_03_optim_states.pt. +62: [2023-04-29 11:26:52,376] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 503 +31: [2023-04-29 11:26:52,378] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +17: [2023-04-29 11:26:52,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +17: [2023-04-29 11:26:52,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +17: [2023-04-29 11:26:52,378] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +17: [2023-04-29 11:26:52,379] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 5: [2023-04-29 11:26:52,379] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 40 +31: [2023-04-29 11:26:52,379] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +28: [2023-04-29 11:26:52,380] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +31: [2023-04-29 11:26:52,380] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt. +31: [2023-04-29 11:26:52,381] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 254 +53: [2023-04-29 11:26:52,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +53: [2023-04-29 11:26:52,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +53: [2023-04-29 11:26:52,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +60: [2023-04-29 11:26:52,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_112_mp_rank_03_optim_states.pt. +53: [2023-04-29 11:26:52,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +60: [2023-04-29 11:26:52,381] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 481 + 4: [2023-04-29 11:26:52,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 4: [2023-04-29 11:26:52,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 4: [2023-04-29 11:26:52,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +49: [2023-04-29 11:26:52,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_70_mp_rank_03_optim_states.pt. + 4: [2023-04-29 11:26:52,381] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +49: [2023-04-29 11:26:52,382] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 397 +28: [2023-04-29 11:26:52,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +28: [2023-04-29 11:26:52,383] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +21: [2023-04-29 11:26:52,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 11:26:52,383] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +28: [2023-04-29 11:26:52,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 7: [2023-04-29 11:26:52,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 7: [2023-04-29 11:26:52,385] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +21: [2023-04-29 11:26:52,386] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +63: [2023-04-29 11:26:52,386] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_125_mp_rank_03_optim_states.pt. +63: [2023-04-29 11:26:52,386] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 507 + 7: [2023-04-29 11:26:52,387] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +31: [2023-04-29 11:26:52,387] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 254 +28: [2023-04-29 11:26:52,388] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 7: [2023-04-29 11:26:52,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +14: [2023-04-29 11:26:52,388] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt. +14: [2023-04-29 11:26:52,388] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 118 +58: [2023-04-29 11:26:52,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_106_mp_rank_03_optim_states.pt. +22: [2023-04-29 11:26:52,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +22: [2023-04-29 11:26:52,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +58: [2023-04-29 11:26:52,389] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 469 +44: [2023-04-29 11:26:52,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +22: [2023-04-29 11:26:52,389] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +44: [2023-04-29 11:26:52,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +44: [2023-04-29 11:26:52,389] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +61: [2023-04-29 11:26:52,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +22: [2023-04-29 11:26:52,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +44: [2023-04-29 11:26:52,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +28: [2023-04-29 11:26:52,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +44: [2023-04-29 11:26:52,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +44: [2023-04-29 11:26:52,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +61: [2023-04-29 11:26:52,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +60: [2023-04-29 11:26:52,390] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_115_mp_rank_03_optim_states.pt. +60: [2023-04-29 11:26:52,391] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 487 +10: [2023-04-29 11:26:52,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt... +10: [2023-04-29 11:26:52,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt... +10: [2023-04-29 11:26:52,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt... +10: [2023-04-29 11:26:52,390] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt... +44: [2023-04-29 11:26:52,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +44: [2023-04-29 11:26:52,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +44: [2023-04-29 11:26:52,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +61: [2023-04-29 11:26:52,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +28: [2023-04-29 11:26:52,391] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +44: [2023-04-29 11:26:52,392] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +44: [2023-04-29 11:26:52,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +44: [2023-04-29 11:26:52,393] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +44: [2023-04-29 11:26:52,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +44: [2023-04-29 11:26:52,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +44: [2023-04-29 11:26:52,393] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +45: [2023-04-29 11:26:52,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +45: [2023-04-29 11:26:52,394] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +45: [2023-04-29 11:26:52,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +45: [2023-04-29 11:26:52,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +35: [2023-04-29 11:26:52,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_15_mp_rank_02_optim_states.pt. +61: [2023-04-29 11:26:52,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +44: [2023-04-29 11:26:52,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +35: [2023-04-29 11:26:52,395] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 286 +26: [2023-04-29 11:26:52,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +26: [2023-04-29 11:26:52,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +33: [2023-04-29 11:26:52,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_7_mp_rank_03_optim_states.pt. +26: [2023-04-29 11:26:52,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +45: [2023-04-29 11:26:52,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +45: [2023-04-29 11:26:52,395] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +33: [2023-04-29 11:26:52,395] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 271 +16: [2023-04-29 11:26:52,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +16: [2023-04-29 11:26:52,395] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +61: [2023-04-29 11:26:52,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +51: [2023-04-29 11:26:52,396] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 415 +40: [2023-04-29 11:26:52,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +40: [2023-04-29 11:26:52,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +26: [2023-04-29 11:26:52,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt. +26: [2023-04-29 11:26:52,396] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 208 +61: [2023-04-29 11:26:52,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +61: [2023-04-29 11:26:52,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +51: [2023-04-29 11:26:52,396] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 409 +14: [2023-04-29 11:26:52,396] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 118 +40: [2023-04-29 11:26:52,396] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +40: [2023-04-29 11:26:52,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +61: [2023-04-29 11:26:52,396] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +61: [2023-04-29 11:26:52,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +51: [2023-04-29 11:26:52,397] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 413 +51: [2023-04-29 11:26:52,397] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 411 +61: [2023-04-29 11:26:52,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +61: [2023-04-29 11:26:52,397] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +28: [2023-04-29 11:26:52,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt. +28: [2023-04-29 11:26:52,397] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 226 +61: [2023-04-29 11:26:52,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +40: [2023-04-29 11:26:52,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +40: [2023-04-29 11:26:52,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +40: [2023-04-29 11:26:52,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +61: [2023-04-29 11:26:52,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +40: [2023-04-29 11:26:52,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +61: [2023-04-29 11:26:52,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +40: [2023-04-29 11:26:52,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +40: [2023-04-29 11:26:52,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +45: [2023-04-29 11:26:52,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +61: [2023-04-29 11:26:52,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +40: [2023-04-29 11:26:52,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +40: [2023-04-29 11:26:52,398] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +61: [2023-04-29 11:26:52,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +45: [2023-04-29 11:26:52,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +45: [2023-04-29 11:26:52,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +16: [2023-04-29 11:26:52,399] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +57: [2023-04-29 11:26:52,399] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +26: [2023-04-29 11:26:52,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +45: [2023-04-29 11:26:52,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +45: [2023-04-29 11:26:52,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +40: [2023-04-29 11:26:52,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +40: [2023-04-29 11:26:52,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +40: [2023-04-29 11:26:52,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +40: [2023-04-29 11:26:52,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +45: [2023-04-29 11:26:52,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +57: [2023-04-29 11:26:52,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +16: [2023-04-29 11:26:52,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +11: [2023-04-29 11:26:52,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +11: [2023-04-29 11:26:52,401] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +57: [2023-04-29 11:26:52,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +57: [2023-04-29 11:26:52,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +57: [2023-04-29 11:26:52,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +57: [2023-04-29 11:26:52,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +32: [2023-04-29 11:26:52,402] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_3_mp_rank_03_optim_states.pt. +57: [2023-04-29 11:26:52,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +32: [2023-04-29 11:26:52,402] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 263 +45: [2023-04-29 11:26:52,402] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +57: [2023-04-29 11:26:52,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +57: [2023-04-29 11:26:52,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +26: [2023-04-29 11:26:52,403] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 208 +45: [2023-04-29 11:26:52,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +45: [2023-04-29 11:26:52,403] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +11: [2023-04-29 11:26:52,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +11: [2023-04-29 11:26:52,403] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +56: [2023-04-29 11:26:52,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_96_mp_rank_03_optim_states.pt... +56: [2023-04-29 11:26:52,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_99_mp_rank_03_optim_states.pt... +56: [2023-04-29 11:26:52,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_97_mp_rank_03_optim_states.pt... +56: [2023-04-29 11:26:52,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_98_mp_rank_03_optim_states.pt... +45: [2023-04-29 11:26:52,404] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +48: [2023-04-29 11:26:52,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_65_mp_rank_03_optim_states.pt... +48: [2023-04-29 11:26:52,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_64_mp_rank_03_optim_states.pt... +48: [2023-04-29 11:26:52,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_66_mp_rank_03_optim_states.pt... +48: [2023-04-29 11:26:52,404] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_67_mp_rank_03_optim_states.pt... +35: [2023-04-29 11:26:52,404] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 286 +57: [2023-04-29 11:26:52,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +57: [2023-04-29 11:26:52,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +57: [2023-04-29 11:26:52,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +61: [2023-04-29 11:26:52,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_119_mp_rank_02_optim_states.pt. +61: [2023-04-29 11:26:52,405] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 494 +57: [2023-04-29 11:26:52,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +57: [2023-04-29 11:26:52,405] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +57: [2023-04-29 11:26:52,405] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +28: [2023-04-29 11:26:52,406] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 226 +57: [2023-04-29 11:26:52,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +52: [2023-04-29 11:26:52,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +52: [2023-04-29 11:26:52,406] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. + 3: [2023-04-29 11:26:52,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt. +32: [2023-04-29 11:26:52,408] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt. + 3: [2023-04-29 11:26:52,408] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 24 +32: [2023-04-29 11:26:52,408] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 260 +22: [2023-04-29 11:26:52,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt. +27: [2023-04-29 11:26:52,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +52: [2023-04-29 11:26:52,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +22: [2023-04-29 11:26:52,409] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 176 +52: [2023-04-29 11:26:52,409] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +53: [2023-04-29 11:26:52,409] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +53: [2023-04-29 11:26:52,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +53: [2023-04-29 11:26:52,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +63: [2023-04-29 11:26:52,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_124_mp_rank_03_optim_states.pt. +63: [2023-04-29 11:26:52,410] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 505 +53: [2023-04-29 11:26:52,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +53: [2023-04-29 11:26:52,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +53: [2023-04-29 11:26:52,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +15: [2023-04-29 11:26:52,410] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt. +53: [2023-04-29 11:26:52,410] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +15: [2023-04-29 11:26:52,411] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 120 +24: [2023-04-29 11:26:52,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt. + 7: [2023-04-29 11:26:52,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 7: [2023-04-29 11:26:52,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +53: [2023-04-29 11:26:52,411] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +53: [2023-04-29 11:26:52,411] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... + 2: [2023-04-29 11:26:52,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 2: [2023-04-29 11:26:52,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 2: [2023-04-29 11:26:52,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +61: [2023-04-29 11:26:52,412] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 494 + 2: [2023-04-29 11:26:52,412] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +53: [2023-04-29 11:26:52,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +24: [2023-04-29 11:26:52,411] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 194 +53: [2023-04-29 11:26:52,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +53: [2023-04-29 11:26:52,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +27: [2023-04-29 11:26:52,413] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +53: [2023-04-29 11:26:52,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +53: [2023-04-29 11:26:52,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +53: [2023-04-29 11:26:52,413] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +21: [2023-04-29 11:26:52,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt. + 8: [2023-04-29 11:26:52,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt. +53: [2023-04-29 11:26:52,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +21: [2023-04-29 11:26:52,414] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 168 + 8: [2023-04-29 11:26:52,414] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 64 +38: [2023-04-29 11:26:52,414] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_27_mp_rank_03_optim_states.pt. +38: [2023-04-29 11:26:52,414] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 311 +32: [2023-04-29 11:26:52,415] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt. + 7: [2023-04-29 11:26:52,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +32: [2023-04-29 11:26:52,415] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 258 + 7: [2023-04-29 11:26:52,415] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 3: [2023-04-29 11:26:52,416] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 24 +32: [2023-04-29 11:26:52,417] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 260 +24: [2023-04-29 11:26:52,418] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 194 +22: [2023-04-29 11:26:52,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +22: [2023-04-29 11:26:52,418] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +15: [2023-04-29 11:26:52,418] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 120 +21: [2023-04-29 11:26:52,420] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 168 +19: [2023-04-29 11:26:52,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt... +19: [2023-04-29 11:26:52,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt... +19: [2023-04-29 11:26:52,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt... +19: [2023-04-29 11:26:52,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt... +22: [2023-04-29 11:26:52,421] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 176 +22: [2023-04-29 11:26:52,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +27: [2023-04-29 11:26:52,421] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +26: [2023-04-29 11:26:52,421] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +49: [2023-04-29 11:26:52,421] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 397 + 8: [2023-04-29 11:26:52,422] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 64 +32: [2023-04-29 11:26:52,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_2_mp_rank_03_optim_states.pt. +32: [2023-04-29 11:26:52,422] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 261 +54: [2023-04-29 11:26:52,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_88_mp_rank_03_optim_states.pt. +32: [2023-04-29 11:26:52,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_1_mp_rank_03_optim_states.pt. +43: [2023-04-29 11:26:52,422] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_46_mp_rank_03_optim_states.pt. +54: [2023-04-29 11:26:52,423] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 433 +43: [2023-04-29 11:26:52,423] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 349 +32: [2023-04-29 11:26:52,423] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 259 +32: [2023-04-29 11:26:52,423] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 258 +49: [2023-04-29 11:26:52,424] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 393 +27: [2023-04-29 11:26:52,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +29: [2023-04-29 11:26:52,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +29: [2023-04-29 11:26:52,424] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +29: [2023-04-29 11:26:52,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +29: [2023-04-29 11:26:52,425] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +16: [2023-04-29 11:26:52,425] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +16: [2023-04-29 11:26:52,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +22: [2023-04-29 11:26:52,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +16: [2023-04-29 11:26:52,426] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +63: [2023-04-29 11:26:52,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_126_mp_rank_03_optim_states.pt. +63: [2023-04-29 11:26:52,427] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 509 +49: [2023-04-29 11:26:52,427] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_71_mp_rank_03_optim_states.pt. +49: [2023-04-29 11:26:52,427] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 399 +12: [2023-04-29 11:26:52,428] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt. +27: [2023-04-29 11:26:52,428] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +12: [2023-04-29 11:26:52,428] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 102 +24: [2023-04-29 11:26:52,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +27: [2023-04-29 11:26:52,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +27: [2023-04-29 11:26:52,430] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +22: [2023-04-29 11:26:52,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt. +36: [2023-04-29 11:26:52,431] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 291 +22: [2023-04-29 11:26:52,431] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 180 + 8: [2023-04-29 11:26:52,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt. + 8: [2023-04-29 11:26:52,431] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 70 +24: [2023-04-29 11:26:52,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt. +26: [2023-04-29 11:26:52,431] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +13: [2023-04-29 11:26:52,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +13: [2023-04-29 11:26:52,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +13: [2023-04-29 11:26:52,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +24: [2023-04-29 11:26:52,432] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 196 +26: [2023-04-29 11:26:52,432] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +13: [2023-04-29 11:26:52,432] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +52: [2023-04-29 11:26:52,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +24: [2023-04-29 11:26:52,433] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +52: [2023-04-29 11:26:52,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +24: [2023-04-29 11:26:52,433] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +52: [2023-04-29 11:26:52,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +49: [2023-04-29 11:26:52,434] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 399 +52: [2023-04-29 11:26:52,434] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +27: [2023-04-29 11:26:52,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +61: [2023-04-29 11:26:52,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_118_mp_rank_03_optim_states.pt... +61: [2023-04-29 11:26:52,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_119_mp_rank_03_optim_states.pt... +16: [2023-04-29 11:26:52,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +61: [2023-04-29 11:26:52,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_116_mp_rank_03_optim_states.pt... +61: [2023-04-29 11:26:52,434] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_117_mp_rank_03_optim_states.pt... +50: [2023-04-29 11:26:52,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +50: [2023-04-29 11:26:52,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +44: [2023-04-29 11:26:52,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_51_mp_rank_03_optim_states.pt... +44: [2023-04-29 11:26:52,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_48_mp_rank_03_optim_states.pt... +50: [2023-04-29 11:26:52,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +44: [2023-04-29 11:26:52,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_49_mp_rank_03_optim_states.pt... +44: [2023-04-29 11:26:52,435] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_50_mp_rank_03_optim_states.pt... +50: [2023-04-29 11:26:52,435] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +58: [2023-04-29 11:26:52,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_105_mp_rank_03_optim_states.pt. +12: [2023-04-29 11:26:52,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +58: [2023-04-29 11:26:52,436] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 467 +15: [2023-04-29 11:26:52,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +12: [2023-04-29 11:26:52,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +12: [2023-04-29 11:26:52,436] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 102 +15: [2023-04-29 11:26:52,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +15: [2023-04-29 11:26:52,436] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +15: [2023-04-29 11:26:52,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +12: [2023-04-29 11:26:52,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +12: [2023-04-29 11:26:52,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +26: [2023-04-29 11:26:52,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +52: [2023-04-29 11:26:52,437] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +52: [2023-04-29 11:26:52,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +24: [2023-04-29 11:26:52,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +52: [2023-04-29 11:26:52,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... + 8: [2023-04-29 11:26:52,438] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 70 +52: [2023-04-29 11:26:52,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +52: [2023-04-29 11:26:52,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +22: [2023-04-29 11:26:52,438] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 180 +52: [2023-04-29 11:26:52,438] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +24: [2023-04-29 11:26:52,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +52: [2023-04-29 11:26:52,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +52: [2023-04-29 11:26:52,439] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +45: [2023-04-29 11:26:52,439] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_52_mp_rank_02_optim_states.pt. +45: [2023-04-29 11:26:52,440] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 360 +24: [2023-04-29 11:26:52,440] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 196 +43: [2023-04-29 11:26:52,442] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 345 + 2: [2023-04-29 11:26:52,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +52: [2023-04-29 11:26:52,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +52: [2023-04-29 11:26:52,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +52: [2023-04-29 11:26:52,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +24: [2023-04-29 11:26:52,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +52: [2023-04-29 11:26:52,442] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +40: [2023-04-29 11:26:52,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_33_mp_rank_03_optim_states.pt... +40: [2023-04-29 11:26:52,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_32_mp_rank_03_optim_states.pt... +40: [2023-04-29 11:26:52,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_34_mp_rank_03_optim_states.pt... +40: [2023-04-29 11:26:52,442] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_35_mp_rank_03_optim_states.pt... + 2: [2023-04-29 11:26:52,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +24: [2023-04-29 11:26:52,443] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 2: [2023-04-29 11:26:52,444] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... + 0: [2023-04-29 11:26:52,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 0: [2023-04-29 11:26:52,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 0: [2023-04-29 11:26:52,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 0: [2023-04-29 11:26:52,444] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 2: [2023-04-29 11:26:52,445] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +54: [2023-04-29 11:26:52,445] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_90_mp_rank_03_optim_states.pt. +54: [2023-04-29 11:26:52,445] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 437 +21: [2023-04-29 11:26:52,446] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +60: [2023-04-29 11:26:52,447] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_113_mp_rank_03_optim_states.pt. +60: [2023-04-29 11:26:52,447] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 483 +52: [2023-04-29 11:26:52,448] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_82_mp_rank_02_optim_states.pt. +52: [2023-04-29 11:26:52,448] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 420 +24: [2023-04-29 11:26:52,448] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 5: [2023-04-29 11:26:52,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt. +24: [2023-04-29 11:26:52,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt. +45: [2023-04-29 11:26:52,449] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 360 + 5: [2023-04-29 11:26:52,449] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt. +24: [2023-04-29 11:26:52,449] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 198 + 5: [2023-04-29 11:26:52,449] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 44 + 5: [2023-04-29 11:26:52,449] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 46 +21: [2023-04-29 11:26:52,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +43: [2023-04-29 11:26:52,452] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 347 +45: [2023-04-29 11:26:52,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_53_mp_rank_03_optim_states.pt... +45: [2023-04-29 11:26:52,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_55_mp_rank_03_optim_states.pt... +45: [2023-04-29 11:26:52,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_54_mp_rank_03_optim_states.pt... +45: [2023-04-29 11:26:52,452] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_52_mp_rank_03_optim_states.pt... +21: [2023-04-29 11:26:52,452] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +43: [2023-04-29 11:26:52,453] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 349 +57: [2023-04-29 11:26:52,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_101_mp_rank_03_optim_states.pt... +57: [2023-04-29 11:26:52,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_100_mp_rank_03_optim_states.pt... +57: [2023-04-29 11:26:52,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_102_mp_rank_03_optim_states.pt... +57: [2023-04-29 11:26:52,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_103_mp_rank_03_optim_states.pt... +36: [2023-04-29 11:26:52,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_16_mp_rank_03_optim_states.pt. +29: [2023-04-29 11:26:52,453] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +36: [2023-04-29 11:26:52,453] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 289 +17: [2023-04-29 11:26:52,455] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt. +29: [2023-04-29 11:26:52,455] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +52: [2023-04-29 11:26:52,455] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 420 +17: [2023-04-29 11:26:52,456] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 138 + 4: [2023-04-29 11:26:52,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt... + 4: [2023-04-29 11:26:52,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt... + 4: [2023-04-29 11:26:52,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt... + 4: [2023-04-29 11:26:52,456] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt... + 5: [2023-04-29 11:26:52,457] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 44 +53: [2023-04-29 11:26:52,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_85_mp_rank_03_optim_states.pt... +53: [2023-04-29 11:26:52,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_84_mp_rank_03_optim_states.pt... +53: [2023-04-29 11:26:52,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_86_mp_rank_03_optim_states.pt... +53: [2023-04-29 11:26:52,457] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_87_mp_rank_03_optim_states.pt... +24: [2023-04-29 11:26:52,457] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 198 + 5: [2023-04-29 11:26:52,457] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 46 +21: [2023-04-29 11:26:52,458] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 5: [2023-04-29 11:26:52,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 5: [2023-04-29 11:26:52,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 5: [2023-04-29 11:26:52,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. + 5: [2023-04-29 11:26:52,458] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_22-model_01-model_states.pt. +43: [2023-04-29 11:26:52,459] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 351 +29: [2023-04-29 11:26:52,459] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +21: [2023-04-29 11:26:52,460] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt. +21: [2023-04-29 11:26:52,460] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 170 +36: [2023-04-29 11:26:52,461] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 289 +13: [2023-04-29 11:26:52,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +17: [2023-04-29 11:26:52,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt... +17: [2023-04-29 11:26:52,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt... +13: [2023-04-29 11:26:52,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +17: [2023-04-29 11:26:52,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt... +17: [2023-04-29 11:26:52,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt... +50: [2023-04-29 11:26:52,461] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +26: [2023-04-29 11:26:52,461] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt. +26: [2023-04-29 11:26:52,462] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 214 +50: [2023-04-29 11:26:52,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +50: [2023-04-29 11:26:52,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +29: [2023-04-29 11:26:52,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +50: [2023-04-29 11:26:52,462] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +50: [2023-04-29 11:26:52,462] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +50: [2023-04-29 11:26:52,463] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +21: [2023-04-29 11:26:52,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 11:26:52,463] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 138 + 7: [2023-04-29 11:26:52,463] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 11:26:52,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 3: [2023-04-29 11:26:52,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +50: [2023-04-29 11:26:52,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 3: [2023-04-29 11:26:52,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +50: [2023-04-29 11:26:52,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +13: [2023-04-29 11:26:52,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +20: [2023-04-29 11:26:52,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt. +50: [2023-04-29 11:26:52,464] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... + 3: [2023-04-29 11:26:52,464] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +13: [2023-04-29 11:26:52,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +50: [2023-04-29 11:26:52,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +20: [2023-04-29 11:26:52,465] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 162 +50: [2023-04-29 11:26:52,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +50: [2023-04-29 11:26:52,465] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +50: [2023-04-29 11:26:52,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +50: [2023-04-29 11:26:52,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +50: [2023-04-29 11:26:52,465] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +21: [2023-04-29 11:26:52,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +50: [2023-04-29 11:26:52,466] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +31: [2023-04-29 11:26:52,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt. + 7: [2023-04-29 11:26:52,467] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +31: [2023-04-29 11:26:52,467] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 248 +59: [2023-04-29 11:26:52,467] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_111_mp_rank_03_optim_states.pt. +21: [2023-04-29 11:26:52,468] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 170 +59: [2023-04-29 11:26:52,468] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 479 +47: [2023-04-29 11:26:52,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +47: [2023-04-29 11:26:52,469] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +11: [2023-04-29 11:26:52,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt... +11: [2023-04-29 11:26:52,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt... +11: [2023-04-29 11:26:52,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt... +11: [2023-04-29 11:26:52,469] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt... +21: [2023-04-29 11:26:52,470] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +26: [2023-04-29 11:26:52,470] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 214 +12: [2023-04-29 11:26:52,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt. +12: [2023-04-29 11:26:52,471] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 100 +20: [2023-04-29 11:26:52,471] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 162 +47: [2023-04-29 11:26:52,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +47: [2023-04-29 11:26:52,472] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +49: [2023-04-29 11:26:52,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_69_mp_rank_03_optim_states.pt. + 7: [2023-04-29 11:26:52,473] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +49: [2023-04-29 11:26:52,473] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 395 +21: [2023-04-29 11:26:52,474] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +31: [2023-04-29 11:26:52,475] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 248 +32: [2023-04-29 11:26:52,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt. +26: [2023-04-29 11:26:52,477] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt. +26: [2023-04-29 11:26:52,477] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 210 +32: [2023-04-29 11:26:52,477] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 257 +12: [2023-04-29 11:26:52,479] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 100 + 7: [2023-04-29 11:26:52,479] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +26: [2023-04-29 11:26:52,479] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt. +26: [2023-04-29 11:26:52,479] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 212 + 7: [2023-04-29 11:26:52,480] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +49: [2023-04-29 11:26:52,482] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 395 +52: [2023-04-29 11:26:52,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_82_mp_rank_03_optim_states.pt... +52: [2023-04-29 11:26:52,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_80_mp_rank_03_optim_states.pt... +52: [2023-04-29 11:26:52,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_81_mp_rank_03_optim_states.pt... +52: [2023-04-29 11:26:52,483] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_83_mp_rank_03_optim_states.pt... + 7: [2023-04-29 11:26:52,484] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +14: [2023-04-29 11:26:52,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +14: [2023-04-29 11:26:52,484] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +26: [2023-04-29 11:26:52,485] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 210 +26: [2023-04-29 11:26:52,485] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +26: [2023-04-29 11:26:52,486] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 212 +14: [2023-04-29 11:26:52,486] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +22: [2023-04-29 11:26:52,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +22: [2023-04-29 11:26:52,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +14: [2023-04-29 11:26:52,487] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 5: [2023-04-29 11:26:52,487] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +14: [2023-04-29 11:26:52,488] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt. + 5: [2023-04-29 11:26:52,488] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +14: [2023-04-29 11:26:52,488] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 116 + 5: [2023-04-29 11:26:52,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +26: [2023-04-29 11:26:52,489] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 7: [2023-04-29 11:26:52,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +16: [2023-04-29 11:26:52,490] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 5: [2023-04-29 11:26:52,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt. +32: [2023-04-29 11:26:52,491] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 261 + 5: [2023-04-29 11:26:52,491] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 42 +32: [2023-04-29 11:26:52,491] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 257 +42: [2023-04-29 11:26:52,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +42: [2023-04-29 11:26:52,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +42: [2023-04-29 11:26:52,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. + 5: [2023-04-29 11:26:52,491] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt... +42: [2023-04-29 11:26:52,491] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +59: [2023-04-29 11:26:52,492] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_109_mp_rank_03_optim_states.pt. +59: [2023-04-29 11:26:52,493] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 475 +22: [2023-04-29 11:26:52,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +22: [2023-04-29 11:26:52,493] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 8: [2023-04-29 11:26:52,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt. +24: [2023-04-29 11:26:52,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt. +32: [2023-04-29 11:26:52,494] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 263 +24: [2023-04-29 11:26:52,494] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 192 +47: [2023-04-29 11:26:52,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +47: [2023-04-29 11:26:52,494] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... + 8: [2023-04-29 11:26:52,494] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 66 +47: [2023-04-29 11:26:52,494] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +47: [2023-04-29 11:26:52,495] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +22: [2023-04-29 11:26:52,496] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +47: [2023-04-29 11:26:52,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +47: [2023-04-29 11:26:52,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... + 7: [2023-04-29 11:26:52,496] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +16: [2023-04-29 11:26:52,497] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +14: [2023-04-29 11:26:52,497] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 116 +12: [2023-04-29 11:26:52,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt... +16: [2023-04-29 11:26:52,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +47: [2023-04-29 11:26:52,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +12: [2023-04-29 11:26:52,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt... +12: [2023-04-29 11:26:52,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt... +12: [2023-04-29 11:26:52,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt... + 5: [2023-04-29 11:26:52,499] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 42 +47: [2023-04-29 11:26:52,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +47: [2023-04-29 11:26:52,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +47: [2023-04-29 11:26:52,499] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +16: [2023-04-29 11:26:52,499] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +32: [2023-04-29 11:26:52,499] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 259 +47: [2023-04-29 11:26:52,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +47: [2023-04-29 11:26:52,500] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. + 8: [2023-04-29 11:26:52,502] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 66 +16: [2023-04-29 11:26:52,502] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +24: [2023-04-29 11:26:52,502] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 192 +22: [2023-04-29 11:26:52,503] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +22: [2023-04-29 11:26:52,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +47: [2023-04-29 11:26:52,503] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +47: [2023-04-29 11:26:52,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. + 6: [2023-04-29 11:26:52,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 6: [2023-04-29 11:26:52,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 6: [2023-04-29 11:26:52,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +47: [2023-04-29 11:26:52,504] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... + 6: [2023-04-29 11:26:52,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +47: [2023-04-29 11:26:52,504] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +16: [2023-04-29 11:26:52,505] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +31: [2023-04-29 11:26:52,505] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt. +31: [2023-04-29 11:26:52,506] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 250 +16: [2023-04-29 11:26:52,507] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +50: [2023-04-29 11:26:52,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_72_mp_rank_03_optim_states.pt... +50: [2023-04-29 11:26:52,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_73_mp_rank_03_optim_states.pt... +50: [2023-04-29 11:26:52,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_74_mp_rank_03_optim_states.pt... +50: [2023-04-29 11:26:52,508] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_75_mp_rank_03_optim_states.pt... + 0: [2023-04-29 11:26:52,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt... + 0: [2023-04-29 11:26:52,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt... + 0: [2023-04-29 11:26:52,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt... + 0: [2023-04-29 11:26:52,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt... +35: [2023-04-29 11:26:52,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +35: [2023-04-29 11:26:52,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +35: [2023-04-29 11:26:52,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +35: [2023-04-29 11:26:52,509] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_44-model_01-model_states.pt. +16: [2023-04-29 11:26:52,509] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +26: [2023-04-29 11:26:52,510] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +22: [2023-04-29 11:26:52,511] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +39: [2023-04-29 11:26:52,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_29_mp_rank_03_optim_states.pt. +39: [2023-04-29 11:26:52,512] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 315 +26: [2023-04-29 11:26:52,512] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +31: [2023-04-29 11:26:52,513] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 250 + 2: [2023-04-29 11:26:52,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 2: [2023-04-29 11:26:52,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 2: [2023-04-29 11:26:52,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 2: [2023-04-29 11:26:52,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +36: [2023-04-29 11:26:52,516] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_18_mp_rank_03_optim_states.pt. +36: [2023-04-29 11:26:52,517] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 293 +26: [2023-04-29 11:26:52,518] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 1: [2023-04-29 11:26:52,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 1: [2023-04-29 11:26:52,519] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 1: [2023-04-29 11:26:52,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 1: [2023-04-29 11:26:52,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +29: [2023-04-29 11:26:52,520] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +26: [2023-04-29 11:26:52,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +26: [2023-04-29 11:26:52,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +42: [2023-04-29 11:26:52,521] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +42: [2023-04-29 11:26:52,522] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +42: [2023-04-29 11:26:52,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +42: [2023-04-29 11:26:52,522] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +42: [2023-04-29 11:26:52,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +42: [2023-04-29 11:26:52,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +42: [2023-04-29 11:26:52,523] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +42: [2023-04-29 11:26:52,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +42: [2023-04-29 11:26:52,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... + 2: [2023-04-29 11:26:52,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 2: [2023-04-29 11:26:52,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 2: [2023-04-29 11:26:52,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 2: [2023-04-29 11:26:52,523] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +36: [2023-04-29 11:26:52,523] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 293 +17: [2023-04-29 11:26:52,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt. +31: [2023-04-29 11:26:52,524] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt. +31: [2023-04-29 11:26:52,524] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 252 +17: [2023-04-29 11:26:52,524] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 136 +29: [2023-04-29 11:26:52,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +15: [2023-04-29 11:26:52,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt. +59: [2023-04-29 11:26:52,525] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_108_mp_rank_03_optim_states.pt. +15: [2023-04-29 11:26:52,525] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 124 +59: [2023-04-29 11:26:52,525] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 473 +42: [2023-04-29 11:26:52,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +42: [2023-04-29 11:26:52,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +42: [2023-04-29 11:26:52,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +42: [2023-04-29 11:26:52,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +42: [2023-04-29 11:26:52,526] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +42: [2023-04-29 11:26:52,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +29: [2023-04-29 11:26:52,526] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +26: [2023-04-29 11:26:52,527] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +42: [2023-04-29 11:26:52,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +46: [2023-04-29 11:26:52,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_56_mp_rank_03_optim_states.pt. +46: [2023-04-29 11:26:52,527] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 369 +59: [2023-04-29 11:26:52,527] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_110_mp_rank_03_optim_states.pt. +59: [2023-04-29 11:26:52,528] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 477 +13: [2023-04-29 11:26:52,528] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +46: [2023-04-29 11:26:52,530] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_57_mp_rank_03_optim_states.pt. +46: [2023-04-29 11:26:52,530] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 371 +29: [2023-04-29 11:26:52,531] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +29: [2023-04-29 11:26:52,532] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 3: [2023-04-29 11:26:52,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt... + 3: [2023-04-29 11:26:52,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt... + 3: [2023-04-29 11:26:52,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt... + 3: [2023-04-29 11:26:52,532] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt... +31: [2023-04-29 11:26:52,533] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 252 +13: [2023-04-29 11:26:52,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 11:26:52,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +15: [2023-04-29 11:26:52,533] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 124 +29: [2023-04-29 11:26:52,533] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +17: [2023-04-29 11:26:52,533] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 136 +46: [2023-04-29 11:26:52,534] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 369 +25: [2023-04-29 11:26:52,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +46: [2023-04-29 11:26:52,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_59_mp_rank_03_optim_states.pt. +18: [2023-04-29 11:26:52,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +18: [2023-04-29 11:26:52,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +25: [2023-04-29 11:26:52,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +25: [2023-04-29 11:26:52,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +46: [2023-04-29 11:26:52,534] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 375 +18: [2023-04-29 11:26:52,534] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +25: [2023-04-29 11:26:52,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +18: [2023-04-29 11:26:52,535] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +23: [2023-04-29 11:26:52,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +23: [2023-04-29 11:26:52,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +23: [2023-04-29 11:26:52,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +15: [2023-04-29 11:26:52,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt... +23: [2023-04-29 11:26:52,536] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +13: [2023-04-29 11:26:52,536] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +15: [2023-04-29 11:26:52,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt... +15: [2023-04-29 11:26:52,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt... +15: [2023-04-29 11:26:52,537] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt... +13: [2023-04-29 11:26:52,537] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +46: [2023-04-29 11:26:52,539] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 371 +13: [2023-04-29 11:26:52,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +13: [2023-04-29 11:26:52,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +35: [2023-04-29 11:26:52,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +35: [2023-04-29 11:26:52,539] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +29: [2023-04-29 11:26:52,540] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +35: [2023-04-29 11:26:52,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +35: [2023-04-29 11:26:52,540] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +46: [2023-04-29 11:26:52,541] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 375 +47: [2023-04-29 11:26:52,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_62_mp_rank_03_optim_states.pt... +47: [2023-04-29 11:26:52,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_60_mp_rank_03_optim_states.pt... +47: [2023-04-29 11:26:52,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_63_mp_rank_03_optim_states.pt... +47: [2023-04-29 11:26:52,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_61_mp_rank_03_optim_states.pt... +35: [2023-04-29 11:26:52,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +35: [2023-04-29 11:26:52,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +35: [2023-04-29 11:26:52,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +35: [2023-04-29 11:26:52,541] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt... +35: [2023-04-29 11:26:52,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +35: [2023-04-29 11:26:52,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +35: [2023-04-29 11:26:52,542] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_00-model_states.pt. +29: [2023-04-29 11:26:52,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +35: [2023-04-29 11:26:52,542] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt... +13: [2023-04-29 11:26:52,544] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +35: [2023-04-29 11:26:52,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +35: [2023-04-29 11:26:52,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +35: [2023-04-29 11:26:52,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +35: [2023-04-29 11:26:52,545] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_46-model_01-model_states.pt. +15: [2023-04-29 11:26:52,546] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt. +15: [2023-04-29 11:26:52,546] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 126 + 5: [2023-04-29 11:26:52,548] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 11:26:52,549] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt. +13: [2023-04-29 11:26:52,549] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 108 +38: [2023-04-29 11:26:52,549] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 305 +38: [2023-04-29 11:26:52,551] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 311 +38: [2023-04-29 11:26:52,552] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 307 + 5: [2023-04-29 11:26:52,553] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +15: [2023-04-29 11:26:52,555] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 126 + 5: [2023-04-29 11:26:52,556] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +13: [2023-04-29 11:26:52,557] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 108 + 5: [2023-04-29 11:26:52,562] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +33: [2023-04-29 11:26:52,565] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 265 +14: [2023-04-29 11:26:52,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt... +14: [2023-04-29 11:26:52,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt... +14: [2023-04-29 11:26:52,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt... +14: [2023-04-29 11:26:52,566] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt... +33: [2023-04-29 11:26:52,566] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 267 + 5: [2023-04-29 11:26:52,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. + 5: [2023-04-29 11:26:52,567] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_00-model_states.pt. +33: [2023-04-29 11:26:52,567] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 271 +33: [2023-04-29 11:26:52,568] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 269 +42: [2023-04-29 11:26:52,569] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_41_mp_rank_03_optim_states.pt... +42: [2023-04-29 11:26:52,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_40_mp_rank_03_optim_states.pt... +42: [2023-04-29 11:26:52,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_42_mp_rank_03_optim_states.pt... +42: [2023-04-29 11:26:52,570] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_43_mp_rank_03_optim_states.pt... + 5: [2023-04-29 11:26:52,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... + 5: [2023-04-29 11:26:52,573] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt... +14: [2023-04-29 11:26:52,583] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt. +14: [2023-04-29 11:26:52,583] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 112 + 6: [2023-04-29 11:26:52,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt... + 6: [2023-04-29 11:26:52,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt... + 6: [2023-04-29 11:26:52,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt... + 6: [2023-04-29 11:26:52,584] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt... +21: [2023-04-29 11:26:52,584] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt. +21: [2023-04-29 11:26:52,584] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 174 + 1: [2023-04-29 11:26:52,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt... + 1: [2023-04-29 11:26:52,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt... + 1: [2023-04-29 11:26:52,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt... + 1: [2023-04-29 11:26:52,586] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt... + 9: [2023-04-29 11:26:52,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 9: [2023-04-29 11:26:52,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 9: [2023-04-29 11:26:52,586] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 9: [2023-04-29 11:26:52,587] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +30: [2023-04-29 11:26:52,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +30: [2023-04-29 11:26:52,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +30: [2023-04-29 11:26:52,588] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +30: [2023-04-29 11:26:52,590] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +14: [2023-04-29 11:26:52,591] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 112 +21: [2023-04-29 11:26:52,592] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 174 +35: [2023-04-29 11:26:52,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_12_mp_rank_03_optim_states.pt... +35: [2023-04-29 11:26:52,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt... +35: [2023-04-29 11:26:52,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt... +35: [2023-04-29 11:26:52,594] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_13_mp_rank_03_optim_states.pt... +20: [2023-04-29 11:26:52,595] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt. +20: [2023-04-29 11:26:52,595] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 164 +25: [2023-04-29 11:26:52,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt... +25: [2023-04-29 11:26:52,601] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt... +25: [2023-04-29 11:26:52,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt... +20: [2023-04-29 11:26:52,602] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 164 +25: [2023-04-29 11:26:52,602] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt... +23: [2023-04-29 11:26:52,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt... +23: [2023-04-29 11:26:52,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt... +23: [2023-04-29 11:26:52,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt... +23: [2023-04-29 11:26:52,607] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt... +38: [2023-04-29 11:26:52,609] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_26_mp_rank_03_optim_states.pt. +38: [2023-04-29 11:26:52,609] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 309 +18: [2023-04-29 11:26:52,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt... +18: [2023-04-29 11:26:52,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt... +18: [2023-04-29 11:26:52,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt... +18: [2023-04-29 11:26:52,612] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt... +55: [2023-04-29 11:26:52,613] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_93_mp_rank_03_optim_states.pt. +55: [2023-04-29 11:26:52,613] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 443 +20: [2023-04-29 11:26:52,614] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt. +20: [2023-04-29 11:26:52,615] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 166 +38: [2023-04-29 11:26:52,617] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 309 +62: [2023-04-29 11:26:52,617] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_121_mp_rank_03_optim_states.pt. +62: [2023-04-29 11:26:52,617] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 499 +55: [2023-04-29 11:26:52,621] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 443 +20: [2023-04-29 11:26:52,622] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 166 +46: [2023-04-29 11:26:52,630] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_58_mp_rank_03_optim_states.pt. +46: [2023-04-29 11:26:52,630] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 373 +30: [2023-04-29 11:26:52,637] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt. +62: [2023-04-29 11:26:52,637] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 497 +62: [2023-04-29 11:26:52,637] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 501 +30: [2023-04-29 11:26:52,637] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 240 +62: [2023-04-29 11:26:52,637] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 499 +46: [2023-04-29 11:26:52,639] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 373 +62: [2023-04-29 11:26:52,641] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 503 +30: [2023-04-29 11:26:52,645] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 240 + 8: [2023-04-29 11:26:52,649] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 8: [2023-04-29 11:26:52,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 8: [2023-04-29 11:26:52,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 8: [2023-04-29 11:26:52,650] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 9: [2023-04-29 11:26:52,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt... + 9: [2023-04-29 11:26:52,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt... + 9: [2023-04-29 11:26:52,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt... + 9: [2023-04-29 11:26:52,657] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt... +30: [2023-04-29 11:26:52,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt... +30: [2023-04-29 11:26:52,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt... +30: [2023-04-29 11:26:52,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt... +30: [2023-04-29 11:26:52,664] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt... +20: [2023-04-29 11:26:52,670] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +20: [2023-04-29 11:26:52,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +20: [2023-04-29 11:26:52,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +20: [2023-04-29 11:26:52,671] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +37: [2023-04-29 11:26:52,696] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_22_mp_rank_03_optim_states.pt. +37: [2023-04-29 11:26:52,696] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 301 +28: [2023-04-29 11:26:52,701] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +28: [2023-04-29 11:26:52,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +28: [2023-04-29 11:26:52,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +28: [2023-04-29 11:26:52,702] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +36: [2023-04-29 11:26:52,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_19_mp_rank_03_optim_states.pt. +41: [2023-04-29 11:26:52,705] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_37_mp_rank_03_optim_states.pt. +36: [2023-04-29 11:26:52,705] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 295 +41: [2023-04-29 11:26:52,705] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 331 +41: [2023-04-29 11:26:52,708] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_39_mp_rank_03_optim_states.pt. +41: [2023-04-29 11:26:52,708] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 335 +36: [2023-04-29 11:26:52,712] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 295 +41: [2023-04-29 11:26:52,714] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 331 +41: [2023-04-29 11:26:52,717] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 335 + 8: [2023-04-29 11:26:52,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt... + 8: [2023-04-29 11:26:52,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt... + 8: [2023-04-29 11:26:52,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt... + 8: [2023-04-29 11:26:52,723] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt... +48: [2023-04-29 11:26:52,731] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_67_mp_rank_03_optim_states.pt. +48: [2023-04-29 11:26:52,731] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 391 + 8: [2023-04-29 11:26:52,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt. + 8: [2023-04-29 11:26:52,737] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 68 +24: [2023-04-29 11:26:52,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +24: [2023-04-29 11:26:52,737] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +24: [2023-04-29 11:26:52,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +24: [2023-04-29 11:26:52,738] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +60: [2023-04-29 11:26:52,743] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 481 +20: [2023-04-29 11:26:52,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt... +20: [2023-04-29 11:26:52,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt... +20: [2023-04-29 11:26:52,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt... + 8: [2023-04-29 11:26:52,744] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 68 +20: [2023-04-29 11:26:52,744] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt... +60: [2023-04-29 11:26:52,747] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 483 +34: [2023-04-29 11:26:52,748] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_11_mp_rank_03_optim_states.pt. +34: [2023-04-29 11:26:52,748] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 279 +60: [2023-04-29 11:26:52,749] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 487 + 7: [2023-04-29 11:26:52,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 7: [2023-04-29 11:26:52,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 7: [2023-04-29 11:26:52,749] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 7: [2023-04-29 11:26:52,750] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +37: [2023-04-29 11:26:52,751] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_23_mp_rank_03_optim_states.pt. +37: [2023-04-29 11:26:52,751] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 303 +60: [2023-04-29 11:26:52,751] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 485 +45: [2023-04-29 11:26:52,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_52_mp_rank_03_optim_states.pt. +56: [2023-04-29 11:26:52,754] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_97_mp_rank_03_optim_states.pt. +45: [2023-04-29 11:26:52,754] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 361 +56: [2023-04-29 11:26:52,754] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 451 +34: [2023-04-29 11:26:52,758] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt. +34: [2023-04-29 11:26:52,759] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 273 +26: [2023-04-29 11:26:52,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +26: [2023-04-29 11:26:52,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +31: [2023-04-29 11:26:52,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +31: [2023-04-29 11:26:52,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +31: [2023-04-29 11:26:52,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +26: [2023-04-29 11:26:52,760] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +31: [2023-04-29 11:26:52,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +26: [2023-04-29 11:26:52,761] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +37: [2023-04-29 11:26:52,763] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_21_mp_rank_03_optim_states.pt. +37: [2023-04-29 11:26:52,763] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 299 +41: [2023-04-29 11:26:52,769] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_36_mp_rank_03_optim_states.pt. +41: [2023-04-29 11:26:52,770] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 329 +28: [2023-04-29 11:26:52,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt... +28: [2023-04-29 11:26:52,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt... +28: [2023-04-29 11:26:52,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt... +28: [2023-04-29 11:26:52,770] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt... +21: [2023-04-29 11:26:52,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +21: [2023-04-29 11:26:52,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +21: [2023-04-29 11:26:52,771] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +21: [2023-04-29 11:26:52,772] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +27: [2023-04-29 11:26:52,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +27: [2023-04-29 11:26:52,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +27: [2023-04-29 11:26:52,774] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +27: [2023-04-29 11:26:52,775] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +41: [2023-04-29 11:26:52,777] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 329 +19: [2023-04-29 11:26:52,778] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt. +19: [2023-04-29 11:26:52,778] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 157 +53: [2023-04-29 11:26:52,785] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_86_mp_rank_03_optim_states.pt. +53: [2023-04-29 11:26:52,785] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 429 +19: [2023-04-29 11:26:52,786] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 157 +55: [2023-04-29 11:26:52,787] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_94_mp_rank_03_optim_states.pt. +55: [2023-04-29 11:26:52,787] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 445 +56: [2023-04-29 11:26:52,788] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 451 +39: [2023-04-29 11:26:52,792] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 319 +55: [2023-04-29 11:26:52,794] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 445 +39: [2023-04-29 11:26:52,794] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 313 +39: [2023-04-29 11:26:52,802] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 317 +22: [2023-04-29 11:26:52,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +22: [2023-04-29 11:26:52,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +22: [2023-04-29 11:26:52,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +22: [2023-04-29 11:26:52,803] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +39: [2023-04-29 11:26:52,804] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 315 +63: [2023-04-29 11:26:52,805] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 511 +16: [2023-04-29 11:26:52,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +16: [2023-04-29 11:26:52,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +16: [2023-04-29 11:26:52,805] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +58: [2023-04-29 11:26:52,805] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 469 +16: [2023-04-29 11:26:52,806] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +24: [2023-04-29 11:26:52,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt... +24: [2023-04-29 11:26:52,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt... +24: [2023-04-29 11:26:52,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt... +24: [2023-04-29 11:26:52,807] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt... + 2: [2023-04-29 11:26:52,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 2: [2023-04-29 11:26:52,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 2: [2023-04-29 11:26:52,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +10: [2023-04-29 11:26:52,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt. + 2: [2023-04-29 11:26:52,807] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +10: [2023-04-29 11:26:52,807] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 85 +63: [2023-04-29 11:26:52,809] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 509 +10: [2023-04-29 11:26:52,809] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt. +10: [2023-04-29 11:26:52,809] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 87 +58: [2023-04-29 11:26:52,810] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 471 +63: [2023-04-29 11:26:52,810] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 505 +58: [2023-04-29 11:26:52,812] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 467 +10: [2023-04-29 11:26:52,814] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 85 + 5: [2023-04-29 11:26:52,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 5: [2023-04-29 11:26:52,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 5: [2023-04-29 11:26:52,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. + 5: [2023-04-29 11:26:52,814] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +58: [2023-04-29 11:26:52,815] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 465 +63: [2023-04-29 11:26:52,815] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 507 +10: [2023-04-29 11:26:52,817] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 87 + 7: [2023-04-29 11:26:52,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt... + 7: [2023-04-29 11:26:52,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt... + 7: [2023-04-29 11:26:52,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt... + 7: [2023-04-29 11:26:52,818] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt... +59: [2023-04-29 11:26:52,819] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 473 +55: [2023-04-29 11:26:52,820] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_92_mp_rank_03_optim_states.pt. +59: [2023-04-29 11:26:52,821] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 479 +55: [2023-04-29 11:26:52,821] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 441 +59: [2023-04-29 11:26:52,821] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 475 +59: [2023-04-29 11:26:52,821] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 477 +20: [2023-04-29 11:26:52,823] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt. +20: [2023-04-29 11:26:52,823] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 160 +53: [2023-04-29 11:26:52,825] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 429 +31: [2023-04-29 11:26:52,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt... +31: [2023-04-29 11:26:52,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt... +31: [2023-04-29 11:26:52,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt... +31: [2023-04-29 11:26:52,827] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt... +10: [2023-04-29 11:26:52,828] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt. +10: [2023-04-29 11:26:52,828] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 81 +26: [2023-04-29 11:26:52,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt... +26: [2023-04-29 11:26:52,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt... +26: [2023-04-29 11:26:52,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt... +26: [2023-04-29 11:26:52,828] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt... +55: [2023-04-29 11:26:52,829] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 441 +20: [2023-04-29 11:26:52,832] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 160 +55: [2023-04-29 11:26:52,835] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_95_mp_rank_03_optim_states.pt. +55: [2023-04-29 11:26:52,835] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 447 +10: [2023-04-29 11:26:52,836] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 81 +29: [2023-04-29 11:26:52,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +29: [2023-04-29 11:26:52,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +29: [2023-04-29 11:26:52,837] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +29: [2023-04-29 11:26:52,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +10: [2023-04-29 11:26:52,838] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt. +10: [2023-04-29 11:26:52,838] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 83 +55: [2023-04-29 11:26:52,843] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 447 +48: [2023-04-29 11:26:52,843] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_64_mp_rank_03_optim_states.pt. +48: [2023-04-29 11:26:52,844] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 385 +10: [2023-04-29 11:26:52,846] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 83 +54: [2023-04-29 11:26:52,847] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 433 +54: [2023-04-29 11:26:52,848] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 439 +27: [2023-04-29 11:26:52,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt... +27: [2023-04-29 11:26:52,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt... +27: [2023-04-29 11:26:52,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt... +27: [2023-04-29 11:26:52,848] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt... +21: [2023-04-29 11:26:52,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt... +21: [2023-04-29 11:26:52,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt... +21: [2023-04-29 11:26:52,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt... +21: [2023-04-29 11:26:52,849] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt... +48: [2023-04-29 11:26:52,855] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 391 +54: [2023-04-29 11:26:52,855] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 437 +44: [2023-04-29 11:26:52,855] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_49_mp_rank_03_optim_states.pt. +44: [2023-04-29 11:26:52,856] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 355 +48: [2023-04-29 11:26:52,856] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 385 +34: [2023-04-29 11:26:52,856] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 273 +44: [2023-04-29 11:26:52,857] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_50_mp_rank_03_optim_states.pt. +44: [2023-04-29 11:26:52,857] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 357 +54: [2023-04-29 11:26:52,858] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 435 +37: [2023-04-29 11:26:52,858] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 303 +34: [2023-04-29 11:26:52,858] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 279 +17: [2023-04-29 11:26:52,860] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt. +17: [2023-04-29 11:26:52,860] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 141 +53: [2023-04-29 11:26:52,861] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_84_mp_rank_03_optim_states.pt. +53: [2023-04-29 11:26:52,861] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 425 +34: [2023-04-29 11:26:52,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_9_mp_rank_03_optim_states.pt. +61: [2023-04-29 11:26:52,862] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_118_mp_rank_03_optim_states.pt. +61: [2023-04-29 11:26:52,862] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 493 +34: [2023-04-29 11:26:52,862] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 275 +44: [2023-04-29 11:26:52,863] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 355 +57: [2023-04-29 11:26:52,863] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_103_mp_rank_03_optim_states.pt. +57: [2023-04-29 11:26:52,863] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 463 +37: [2023-04-29 11:26:52,864] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 299 +37: [2023-04-29 11:26:52,865] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 301 +44: [2023-04-29 11:26:52,865] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 357 +17: [2023-04-29 11:26:52,867] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 141 +34: [2023-04-29 11:26:52,867] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt. +34: [2023-04-29 11:26:52,867] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 277 +53: [2023-04-29 11:26:52,868] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 425 +34: [2023-04-29 11:26:52,869] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 275 +57: [2023-04-29 11:26:52,870] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 463 +16: [2023-04-29 11:26:52,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt... +16: [2023-04-29 11:26:52,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt... +16: [2023-04-29 11:26:52,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt... +16: [2023-04-29 11:26:52,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt... +44: [2023-04-29 11:26:52,874] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_51_mp_rank_03_optim_states.pt. +22: [2023-04-29 11:26:52,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt... +22: [2023-04-29 11:26:52,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt... +22: [2023-04-29 11:26:52,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt... +22: [2023-04-29 11:26:52,874] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt... +44: [2023-04-29 11:26:52,874] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 359 +12: [2023-04-29 11:26:52,875] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt. +12: [2023-04-29 11:26:52,875] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 99 +34: [2023-04-29 11:26:52,875] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 277 +45: [2023-04-29 11:26:52,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_53_mp_rank_03_optim_states.pt. +45: [2023-04-29 11:26:52,881] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 363 +19: [2023-04-29 11:26:52,881] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt. +19: [2023-04-29 11:26:52,881] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 153 +12: [2023-04-29 11:26:52,882] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 99 +44: [2023-04-29 11:26:52,883] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 359 + 2: [2023-04-29 11:26:52,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt... + 2: [2023-04-29 11:26:52,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt... + 2: [2023-04-29 11:26:52,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt... + 2: [2023-04-29 11:26:52,885] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt... +57: [2023-04-29 11:26:52,885] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_101_mp_rank_03_optim_states.pt. +57: [2023-04-29 11:26:52,885] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 459 +19: [2023-04-29 11:26:52,886] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt. +19: [2023-04-29 11:26:52,887] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 159 + 5: [2023-04-29 11:26:52,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt... + 5: [2023-04-29 11:26:52,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt... + 5: [2023-04-29 11:26:52,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt... + 5: [2023-04-29 11:26:52,886] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt... +13: [2023-04-29 11:26:52,888] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +13: [2023-04-29 11:26:52,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +13: [2023-04-29 11:26:52,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +13: [2023-04-29 11:26:52,889] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/layer_23-model_01-model_states.pt. +19: [2023-04-29 11:26:52,890] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 153 +61: [2023-04-29 11:26:52,891] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 493 +52: [2023-04-29 11:26:52,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_83_mp_rank_03_optim_states.pt. +52: [2023-04-29 11:26:52,892] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 423 +57: [2023-04-29 11:26:52,892] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 459 +53: [2023-04-29 11:26:52,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_87_mp_rank_03_optim_states.pt. +61: [2023-04-29 11:26:52,892] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_117_mp_rank_03_optim_states.pt. +53: [2023-04-29 11:26:52,892] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 431 +61: [2023-04-29 11:26:52,892] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 491 +19: [2023-04-29 11:26:52,893] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 159 +40: [2023-04-29 11:26:52,899] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_33_mp_rank_03_optim_states.pt. +40: [2023-04-29 11:26:52,899] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 323 +52: [2023-04-29 11:26:52,899] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 423 +61: [2023-04-29 11:26:52,900] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 491 +53: [2023-04-29 11:26:52,901] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 431 +45: [2023-04-29 11:26:52,903] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_55_mp_rank_03_optim_states.pt. +45: [2023-04-29 11:26:52,903] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 367 + 4: [2023-04-29 11:26:52,906] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt. + 4: [2023-04-29 11:26:52,906] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 33 +40: [2023-04-29 11:26:52,906] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 323 +61: [2023-04-29 11:26:52,910] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_119_mp_rank_03_optim_states.pt. +61: [2023-04-29 11:26:52,910] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 495 +29: [2023-04-29 11:26:52,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt... +29: [2023-04-29 11:26:52,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt... +29: [2023-04-29 11:26:52,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt... +29: [2023-04-29 11:26:52,911] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt... +40: [2023-04-29 11:26:52,911] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_34_mp_rank_03_optim_states.pt. +40: [2023-04-29 11:26:52,911] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 325 +50: [2023-04-29 11:26:52,912] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_73_mp_rank_03_optim_states.pt. +50: [2023-04-29 11:26:52,912] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 403 + 4: [2023-04-29 11:26:52,913] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 33 +17: [2023-04-29 11:26:52,915] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt. +17: [2023-04-29 11:26:52,915] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 137 +57: [2023-04-29 11:26:52,918] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_100_mp_rank_03_optim_states.pt. +57: [2023-04-29 11:26:52,918] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 457 +61: [2023-04-29 11:26:52,918] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 495 +40: [2023-04-29 11:26:52,918] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 325 +50: [2023-04-29 11:26:52,918] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 403 +48: [2023-04-29 11:26:52,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_66_mp_rank_03_optim_states.pt. + 0: [2023-04-29 11:26:52,919] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt. +48: [2023-04-29 11:26:52,919] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 389 + 0: [2023-04-29 11:26:52,920] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 1 +15: [2023-04-29 11:26:52,920] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt. +15: [2023-04-29 11:26:52,920] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 127 +17: [2023-04-29 11:26:52,922] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 137 +15: [2023-04-29 11:26:52,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt. + 4: [2023-04-29 11:26:52,923] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt. +15: [2023-04-29 11:26:52,923] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 121 + 4: [2023-04-29 11:26:52,923] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 37 +40: [2023-04-29 11:26:52,925] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_32_mp_rank_03_optim_states.pt. +40: [2023-04-29 11:26:52,926] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 321 + 0: [2023-04-29 11:26:52,926] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 1 +48: [2023-04-29 11:26:52,927] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 389 +57: [2023-04-29 11:26:52,928] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 457 +15: [2023-04-29 11:26:52,928] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 127 + 0: [2023-04-29 11:26:52,928] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt. + 0: [2023-04-29 11:26:52,928] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 7 +52: [2023-04-29 11:26:52,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_82_mp_rank_03_optim_states.pt. +50: [2023-04-29 11:26:52,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_74_mp_rank_03_optim_states.pt. +52: [2023-04-29 11:26:52,929] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 421 +50: [2023-04-29 11:26:52,929] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 405 +40: [2023-04-29 11:26:52,929] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_35_mp_rank_03_optim_states.pt. +40: [2023-04-29 11:26:52,930] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 327 + 0: [2023-04-29 11:26:52,930] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt. + 0: [2023-04-29 11:26:52,930] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 3 + 4: [2023-04-29 11:26:52,931] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 37 +15: [2023-04-29 11:26:52,932] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 121 +21: [2023-04-29 11:26:52,932] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt. +21: [2023-04-29 11:26:52,932] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 172 +40: [2023-04-29 11:26:52,933] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 321 +53: [2023-04-29 11:26:52,934] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_85_mp_rank_03_optim_states.pt. +53: [2023-04-29 11:26:52,934] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 427 +52: [2023-04-29 11:26:52,936] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 421 +50: [2023-04-29 11:26:52,937] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 405 + 0: [2023-04-29 11:26:52,937] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 7 +40: [2023-04-29 11:26:52,937] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 327 +45: [2023-04-29 11:26:52,939] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 363 + 0: [2023-04-29 11:26:52,939] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 3 +21: [2023-04-29 11:26:52,939] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 172 +45: [2023-04-29 11:26:52,941] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 367 +53: [2023-04-29 11:26:52,942] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 427 +45: [2023-04-29 11:26:52,945] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 361 +37: [2023-04-29 11:26:52,947] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_20_mp_rank_03_optim_states.pt. +37: [2023-04-29 11:26:52,947] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 297 +12: [2023-04-29 11:26:52,952] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt. +12: [2023-04-29 11:26:52,952] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 101 + 3: [2023-04-29 11:26:52,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt. +56: [2023-04-29 11:26:52,954] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_98_mp_rank_03_optim_states.pt. +56: [2023-04-29 11:26:52,954] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 453 + 3: [2023-04-29 11:26:52,954] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 31 +61: [2023-04-29 11:26:52,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_116_mp_rank_03_optim_states.pt. +61: [2023-04-29 11:26:52,955] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 489 +18: [2023-04-29 11:26:52,955] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt. +18: [2023-04-29 11:26:52,956] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 149 +37: [2023-04-29 11:26:52,957] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 297 + 3: [2023-04-29 11:26:52,960] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 31 +44: [2023-04-29 11:26:52,960] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_48_mp_rank_03_optim_states.pt. +44: [2023-04-29 11:26:52,961] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 353 +12: [2023-04-29 11:26:52,961] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 101 +56: [2023-04-29 11:26:52,962] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 453 +18: [2023-04-29 11:26:52,964] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 149 +14: [2023-04-29 11:26:52,964] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt. +14: [2023-04-29 11:26:52,964] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 119 +12: [2023-04-29 11:26:52,966] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt. +12: [2023-04-29 11:26:52,966] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 103 +61: [2023-04-29 11:26:52,966] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 489 +44: [2023-04-29 11:26:52,967] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 353 +45: [2023-04-29 11:26:52,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_54_mp_rank_03_optim_states.pt. +47: [2023-04-29 11:26:52,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_60_mp_rank_03_optim_states.pt. +56: [2023-04-29 11:26:52,971] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_96_mp_rank_03_optim_states.pt. +45: [2023-04-29 11:26:52,971] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 365 +56: [2023-04-29 11:26:52,971] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 449 +47: [2023-04-29 11:26:52,971] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 377 +13: [2023-04-29 11:26:52,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt... +14: [2023-04-29 11:26:52,972] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 119 +13: [2023-04-29 11:26:52,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt... +13: [2023-04-29 11:26:52,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt... +13: [2023-04-29 11:26:52,972] [INFO] [torch_checkpoint_engine.py:21:load] [Torch] Loading checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt... +12: [2023-04-29 11:26:52,972] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 103 +11: [2023-04-29 11:26:52,975] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt. +11: [2023-04-29 11:26:52,975] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 89 +25: [2023-04-29 11:26:52,977] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt. +25: [2023-04-29 11:26:52,977] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 205 +47: [2023-04-29 11:26:52,978] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 377 +56: [2023-04-29 11:26:52,978] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 449 +45: [2023-04-29 11:26:52,979] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 365 +11: [2023-04-29 11:26:52,981] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 89 +25: [2023-04-29 11:26:52,985] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 205 +35: [2023-04-29 11:26:52,985] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_13_mp_rank_03_optim_states.pt. +35: [2023-04-29 11:26:52,986] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 283 + 3: [2023-04-29 11:26:52,990] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt. + 3: [2023-04-29 11:26:52,990] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 29 +41: [2023-04-29 11:26:52,992] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_38_mp_rank_03_optim_states.pt. +41: [2023-04-29 11:26:52,993] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 333 +35: [2023-04-29 11:26:52,993] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 283 + 4: [2023-04-29 11:26:52,994] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt. + 4: [2023-04-29 11:26:52,994] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 35 +18: [2023-04-29 11:26:52,996] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt. +18: [2023-04-29 11:26:52,997] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 151 + 3: [2023-04-29 11:26:52,998] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 29 +42: [2023-04-29 11:26:52,998] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_41_mp_rank_03_optim_states.pt. +42: [2023-04-29 11:26:52,998] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 339 +41: [2023-04-29 11:26:53,000] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 333 + 4: [2023-04-29 11:26:53,002] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 35 +50: [2023-04-29 11:26:53,003] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_75_mp_rank_03_optim_states.pt. +50: [2023-04-29 11:26:53,003] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 407 +42: [2023-04-29 11:26:53,006] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 339 +18: [2023-04-29 11:26:53,006] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 151 + 0: [2023-04-29 11:26:53,007] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt. + 0: [2023-04-29 11:26:53,008] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 5 +57: [2023-04-29 11:26:53,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_102_mp_rank_03_optim_states.pt. +57: [2023-04-29 11:26:53,008] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 461 +11: [2023-04-29 11:26:53,008] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt. +11: [2023-04-29 11:26:53,009] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 95 + 6: [2023-04-29 11:26:53,009] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt. + 6: [2023-04-29 11:26:53,009] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 51 +14: [2023-04-29 11:26:53,010] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt. +14: [2023-04-29 11:26:53,010] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 113 +35: [2023-04-29 11:26:53,011] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_12_mp_rank_03_optim_states.pt. +35: [2023-04-29 11:26:53,011] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 281 +50: [2023-04-29 11:26:53,012] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 407 + 3: [2023-04-29 11:26:53,014] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt. + 3: [2023-04-29 11:26:53,014] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 25 +50: [2023-04-29 11:26:53,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_72_mp_rank_03_optim_states.pt. +50: [2023-04-29 11:26:53,015] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 401 +23: [2023-04-29 11:26:53,015] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt. +23: [2023-04-29 11:26:53,016] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 191 +57: [2023-04-29 11:26:53,017] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 461 +11: [2023-04-29 11:26:53,017] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 95 +14: [2023-04-29 11:26:53,017] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 113 + 0: [2023-04-29 11:26:53,017] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 5 + 6: [2023-04-29 11:26:53,017] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 51 + 1: [2023-04-29 11:26:53,017] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt. + 1: [2023-04-29 11:26:53,018] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 9 +42: [2023-04-29 11:26:53,018] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_42_mp_rank_03_optim_states.pt. +42: [2023-04-29 11:26:53,019] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 341 +52: [2023-04-29 11:26:53,019] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_81_mp_rank_03_optim_states.pt. +52: [2023-04-29 11:26:53,019] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 419 +35: [2023-04-29 11:26:53,020] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 281 +15: [2023-04-29 11:26:53,021] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt. +15: [2023-04-29 11:26:53,021] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 125 + 3: [2023-04-29 11:26:53,022] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 25 +50: [2023-04-29 11:26:53,022] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 401 +14: [2023-04-29 11:26:53,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt. +14: [2023-04-29 11:26:53,024] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 117 +12: [2023-04-29 11:26:53,024] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt. +23: [2023-04-29 11:26:53,024] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 191 + 1: [2023-04-29 11:26:53,025] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 9 +12: [2023-04-29 11:26:53,025] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 97 +42: [2023-04-29 11:26:53,026] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 341 +52: [2023-04-29 11:26:53,027] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 419 +23: [2023-04-29 11:26:53,028] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt. +23: [2023-04-29 11:26:53,028] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 185 +15: [2023-04-29 11:26:53,029] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 125 +14: [2023-04-29 11:26:53,031] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 117 +12: [2023-04-29 11:26:53,031] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 97 + 6: [2023-04-29 11:26:53,032] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt. + 6: [2023-04-29 11:26:53,033] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 55 + 3: [2023-04-29 11:26:53,033] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt. + 3: [2023-04-29 11:26:53,033] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 27 +23: [2023-04-29 11:26:53,035] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 185 +48: [2023-04-29 11:26:53,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_65_mp_rank_03_optim_states.pt. +23: [2023-04-29 11:26:53,035] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt. +48: [2023-04-29 11:26:53,035] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 387 +23: [2023-04-29 11:26:53,035] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 187 + 3: [2023-04-29 11:26:53,039] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 27 + 6: [2023-04-29 11:26:53,041] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 55 +42: [2023-04-29 11:26:53,041] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_43_mp_rank_03_optim_states.pt. +23: [2023-04-29 11:26:53,041] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 187 +48: [2023-04-29 11:26:53,042] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 387 +42: [2023-04-29 11:26:53,042] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 343 +17: [2023-04-29 11:26:53,048] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt. +17: [2023-04-29 11:26:53,048] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 143 +42: [2023-04-29 11:26:53,049] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 343 +35: [2023-04-29 11:26:53,051] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt. +35: [2023-04-29 11:26:53,051] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 285 + 6: [2023-04-29 11:26:53,054] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt. + 6: [2023-04-29 11:26:53,055] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 49 +17: [2023-04-29 11:26:53,057] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 143 +47: [2023-04-29 11:26:53,059] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_62_mp_rank_03_optim_states.pt. +47: [2023-04-29 11:26:53,060] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 381 +35: [2023-04-29 11:26:53,060] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 285 +47: [2023-04-29 11:26:53,060] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_61_mp_rank_03_optim_states.pt. +47: [2023-04-29 11:26:53,060] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 379 + 6: [2023-04-29 11:26:53,062] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 49 + 9: [2023-04-29 11:26:53,063] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt. + 9: [2023-04-29 11:26:53,063] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 77 +42: [2023-04-29 11:26:53,064] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_40_mp_rank_03_optim_states.pt. +42: [2023-04-29 11:26:53,064] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 337 +47: [2023-04-29 11:26:53,066] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 381 +47: [2023-04-29 11:26:53,068] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 379 + 9: [2023-04-29 11:26:53,070] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 77 +42: [2023-04-29 11:26:53,072] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 337 + 6: [2023-04-29 11:26:53,072] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt. + 6: [2023-04-29 11:26:53,072] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 53 +14: [2023-04-29 11:26:53,074] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt. +14: [2023-04-29 11:26:53,074] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 115 + 6: [2023-04-29 11:26:53,080] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 53 +14: [2023-04-29 11:26:53,081] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 115 + 9: [2023-04-29 11:26:53,082] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt. + 9: [2023-04-29 11:26:53,082] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 79 + 1: [2023-04-29 11:26:53,083] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt. + 1: [2023-04-29 11:26:53,083] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 11 +25: [2023-04-29 11:26:53,087] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt. +25: [2023-04-29 11:26:53,087] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 203 + 1: [2023-04-29 11:26:53,090] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 11 + 9: [2023-04-29 11:26:53,092] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 79 +25: [2023-04-29 11:26:53,094] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 203 +30: [2023-04-29 11:26:53,099] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt. +30: [2023-04-29 11:26:53,099] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 243 +30: [2023-04-29 11:26:53,106] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 243 +19: [2023-04-29 11:26:53,109] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt. +19: [2023-04-29 11:26:53,109] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 155 +17: [2023-04-29 11:26:53,114] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt. +17: [2023-04-29 11:26:53,115] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 139 +19: [2023-04-29 11:26:53,115] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 155 + 9: [2023-04-29 11:26:53,118] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt. + 9: [2023-04-29 11:26:53,119] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 73 +17: [2023-04-29 11:26:53,122] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 139 + 9: [2023-04-29 11:26:53,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt. +20: [2023-04-29 11:26:53,122] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt. +20: [2023-04-29 11:26:53,123] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 163 + 9: [2023-04-29 11:26:53,123] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 75 + 9: [2023-04-29 11:26:53,125] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 73 +20: [2023-04-29 11:26:53,130] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 163 + 9: [2023-04-29 11:26:53,131] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 75 +28: [2023-04-29 11:26:53,132] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt. +28: [2023-04-29 11:26:53,132] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 227 +28: [2023-04-29 11:26:53,140] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 227 +20: [2023-04-29 11:26:53,141] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt. +20: [2023-04-29 11:26:53,141] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 161 +20: [2023-04-29 11:26:53,148] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 161 +56: [2023-04-29 11:26:53,150] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_99_mp_rank_03_optim_states.pt. +56: [2023-04-29 11:26:53,150] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 455 +47: [2023-04-29 11:26:53,152] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_63_mp_rank_03_optim_states.pt. +47: [2023-04-29 11:26:53,152] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 383 +11: [2023-04-29 11:26:53,159] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt. +47: [2023-04-29 11:26:53,159] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 383 +11: [2023-04-29 11:26:53,159] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 91 +56: [2023-04-29 11:26:53,159] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 455 +15: [2023-04-29 11:26:53,160] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt. +15: [2023-04-29 11:26:53,161] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 123 +11: [2023-04-29 11:26:53,168] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 91 +15: [2023-04-29 11:26:53,170] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 123 +30: [2023-04-29 11:26:53,172] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt. +30: [2023-04-29 11:26:53,172] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 241 +35: [2023-04-29 11:26:53,174] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt. +35: [2023-04-29 11:26:53,174] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 287 +30: [2023-04-29 11:26:53,180] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 241 +23: [2023-04-29 11:26:53,180] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt. +23: [2023-04-29 11:26:53,180] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 189 + 8: [2023-04-29 11:26:53,181] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt. + 8: [2023-04-29 11:26:53,181] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 65 +35: [2023-04-29 11:26:53,185] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 287 +25: [2023-04-29 11:26:53,185] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt. +25: [2023-04-29 11:26:53,185] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 201 +23: [2023-04-29 11:26:53,187] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 189 +20: [2023-04-29 11:26:53,188] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt. +20: [2023-04-29 11:26:53,189] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 167 + 8: [2023-04-29 11:26:53,190] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt. + 8: [2023-04-29 11:26:53,191] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 71 + 8: [2023-04-29 11:26:53,191] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 65 +25: [2023-04-29 11:26:53,193] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 201 +20: [2023-04-29 11:26:53,197] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 167 + 8: [2023-04-29 11:26:53,198] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 71 + 1: [2023-04-29 11:26:53,198] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt. + 1: [2023-04-29 11:26:53,199] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 15 +30: [2023-04-29 11:26:53,199] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt. +30: [2023-04-29 11:26:53,200] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 245 +24: [2023-04-29 11:26:53,204] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt. +24: [2023-04-29 11:26:53,204] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 193 + 1: [2023-04-29 11:26:53,206] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 15 +30: [2023-04-29 11:26:53,206] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 245 +31: [2023-04-29 11:26:53,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt. +31: [2023-04-29 11:26:53,207] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 251 +28: [2023-04-29 11:26:53,207] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt. +28: [2023-04-29 11:26:53,207] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 225 +24: [2023-04-29 11:26:53,211] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 193 +28: [2023-04-29 11:26:53,214] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 225 +31: [2023-04-29 11:26:53,214] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 251 + 8: [2023-04-29 11:26:53,217] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt. + 8: [2023-04-29 11:26:53,218] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 67 + 7: [2023-04-29 11:26:53,219] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt. + 7: [2023-04-29 11:26:53,220] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 59 + 2: [2023-04-29 11:26:53,220] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt. + 2: [2023-04-29 11:26:53,221] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 17 +28: [2023-04-29 11:26:53,221] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt. +28: [2023-04-29 11:26:53,221] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 231 + 8: [2023-04-29 11:26:53,224] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 67 +22: [2023-04-29 11:26:53,227] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt. +28: [2023-04-29 11:26:53,227] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 231 +22: [2023-04-29 11:26:53,228] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 183 + 2: [2023-04-29 11:26:53,228] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 17 + 7: [2023-04-29 11:26:53,228] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 59 +31: [2023-04-29 11:26:53,232] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt. +31: [2023-04-29 11:26:53,232] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 255 +22: [2023-04-29 11:26:53,235] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 183 +24: [2023-04-29 11:26:53,238] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt. +24: [2023-04-29 11:26:53,238] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 199 +31: [2023-04-29 11:26:53,239] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 255 +21: [2023-04-29 11:26:53,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt. +21: [2023-04-29 11:26:53,245] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 169 + 7: [2023-04-29 11:26:53,245] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt. + 7: [2023-04-29 11:26:53,246] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 61 +24: [2023-04-29 11:26:53,246] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 199 +26: [2023-04-29 11:26:53,247] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt. +26: [2023-04-29 11:26:53,247] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 215 +24: [2023-04-29 11:26:53,248] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt. +24: [2023-04-29 11:26:53,249] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 195 +21: [2023-04-29 11:26:53,252] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 169 +31: [2023-04-29 11:26:53,252] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt. +31: [2023-04-29 11:26:53,252] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 249 +26: [2023-04-29 11:26:53,255] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 215 +24: [2023-04-29 11:26:53,256] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 195 + 7: [2023-04-29 11:26:53,257] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 61 + 4: [2023-04-29 11:26:53,260] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt. +31: [2023-04-29 11:26:53,260] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 249 + 4: [2023-04-29 11:26:53,261] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 39 +26: [2023-04-29 11:26:53,261] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt. +26: [2023-04-29 11:26:53,261] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 209 + 4: [2023-04-29 11:26:53,268] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 39 +26: [2023-04-29 11:26:53,269] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 209 +26: [2023-04-29 11:26:53,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt. +30: [2023-04-29 11:26:53,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt. + 2: [2023-04-29 11:26:53,270] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt. +30: [2023-04-29 11:26:53,270] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 247 +26: [2023-04-29 11:26:53,270] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 211 + 2: [2023-04-29 11:26:53,271] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 21 +22: [2023-04-29 11:26:53,272] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt. +22: [2023-04-29 11:26:53,272] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 179 +24: [2023-04-29 11:26:53,275] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt. +24: [2023-04-29 11:26:53,275] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 197 +52: [2023-04-29 11:26:53,277] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_80_mp_rank_03_optim_states.pt. +52: [2023-04-29 11:26:53,277] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 417 +30: [2023-04-29 11:26:53,278] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 247 +26: [2023-04-29 11:26:53,278] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 211 + 2: [2023-04-29 11:26:53,279] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 21 +22: [2023-04-29 11:26:53,280] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 179 + 5: [2023-04-29 11:26:53,280] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt. + 5: [2023-04-29 11:26:53,280] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 47 +27: [2023-04-29 11:26:53,281] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt. +27: [2023-04-29 11:26:53,281] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 217 + 1: [2023-04-29 11:26:53,282] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt. + 1: [2023-04-29 11:26:53,282] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 13 +24: [2023-04-29 11:26:53,283] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 197 +27: [2023-04-29 11:26:53,283] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt. +27: [2023-04-29 11:26:53,283] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 223 +52: [2023-04-29 11:26:53,284] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 417 +20: [2023-04-29 11:26:53,285] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt. +20: [2023-04-29 11:26:53,285] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 165 + 5: [2023-04-29 11:26:53,287] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 47 +27: [2023-04-29 11:26:53,288] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 217 + 1: [2023-04-29 11:26:53,289] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 13 +27: [2023-04-29 11:26:53,290] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 223 +20: [2023-04-29 11:26:53,291] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 165 +18: [2023-04-29 11:26:53,291] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt. +18: [2023-04-29 11:26:53,292] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 145 +29: [2023-04-29 11:26:53,296] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt. +29: [2023-04-29 11:26:53,296] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 235 +11: [2023-04-29 11:26:53,298] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt. +11: [2023-04-29 11:26:53,298] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 93 +18: [2023-04-29 11:26:53,299] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 145 +29: [2023-04-29 11:26:53,303] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 235 +26: [2023-04-29 11:26:53,305] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt. +26: [2023-04-29 11:26:53,305] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 213 +27: [2023-04-29 11:26:53,307] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt. +27: [2023-04-29 11:26:53,307] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 221 +11: [2023-04-29 11:26:53,307] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 93 +26: [2023-04-29 11:26:53,311] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 213 +16: [2023-04-29 11:26:53,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt. +16: [2023-04-29 11:26:53,312] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 133 + 2: [2023-04-29 11:26:53,312] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt. + 2: [2023-04-29 11:26:53,313] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 19 +27: [2023-04-29 11:26:53,314] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 221 + 5: [2023-04-29 11:26:53,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt. +16: [2023-04-29 11:26:53,317] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt. + 5: [2023-04-29 11:26:53,317] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 45 +16: [2023-04-29 11:26:53,317] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 129 +21: [2023-04-29 11:26:53,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt. +16: [2023-04-29 11:26:53,319] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 133 +21: [2023-04-29 11:26:53,320] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 175 +16: [2023-04-29 11:26:53,320] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt. +16: [2023-04-29 11:26:53,321] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 135 + 2: [2023-04-29 11:26:53,321] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 19 + 5: [2023-04-29 11:26:53,324] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 45 +16: [2023-04-29 11:26:53,325] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 129 +21: [2023-04-29 11:26:53,326] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 175 +16: [2023-04-29 11:26:53,329] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 135 +28: [2023-04-29 11:26:53,332] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt. +28: [2023-04-29 11:26:53,332] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 229 +16: [2023-04-29 11:26:53,334] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt. +16: [2023-04-29 11:26:53,334] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 131 +18: [2023-04-29 11:26:53,336] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt. +18: [2023-04-29 11:26:53,336] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 147 +29: [2023-04-29 11:26:53,338] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt. +29: [2023-04-29 11:26:53,338] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 239 +21: [2023-04-29 11:26:53,340] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt. +21: [2023-04-29 11:26:53,340] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 171 +16: [2023-04-29 11:26:53,342] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 131 +28: [2023-04-29 11:26:53,342] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 229 +18: [2023-04-29 11:26:53,343] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 147 + 5: [2023-04-29 11:26:53,344] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt. + 5: [2023-04-29 11:26:53,344] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 41 +29: [2023-04-29 11:26:53,346] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 239 +21: [2023-04-29 11:26:53,348] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 171 + 5: [2023-04-29 11:26:53,352] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 41 + 5: [2023-04-29 11:26:53,354] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt. + 5: [2023-04-29 11:26:53,355] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 43 + 5: [2023-04-29 11:26:53,362] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 43 +29: [2023-04-29 11:26:53,367] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt. +29: [2023-04-29 11:26:53,367] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 237 +29: [2023-04-29 11:26:53,374] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 237 +25: [2023-04-29 11:26:53,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt. +25: [2023-04-29 11:26:53,377] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 207 + 7: [2023-04-29 11:26:53,377] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt. + 7: [2023-04-29 11:26:53,378] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 63 + 7: [2023-04-29 11:26:53,385] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 63 +25: [2023-04-29 11:26:53,385] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 207 +27: [2023-04-29 11:26:53,394] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt. +27: [2023-04-29 11:26:53,394] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 219 +22: [2023-04-29 11:26:53,397] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt. +22: [2023-04-29 11:26:53,397] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 181 +21: [2023-04-29 11:26:53,398] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt. +21: [2023-04-29 11:26:53,398] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 173 + 7: [2023-04-29 11:26:53,400] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt. + 7: [2023-04-29 11:26:53,400] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 57 +27: [2023-04-29 11:26:53,403] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 219 +22: [2023-04-29 11:26:53,405] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 181 +21: [2023-04-29 11:26:53,407] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 173 + 7: [2023-04-29 11:26:53,407] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 57 +31: [2023-04-29 11:26:53,417] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt. +31: [2023-04-29 11:26:53,417] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 253 +31: [2023-04-29 11:26:53,424] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 253 +13: [2023-04-29 11:26:53,429] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt. +13: [2023-04-29 11:26:53,429] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 111 + 2: [2023-04-29 11:26:53,431] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt. + 2: [2023-04-29 11:26:53,431] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 23 +13: [2023-04-29 11:26:53,437] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 111 + 8: [2023-04-29 11:26:53,437] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt. + 8: [2023-04-29 11:26:53,438] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 69 +13: [2023-04-29 11:26:53,438] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt. +13: [2023-04-29 11:26:53,438] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 107 + 2: [2023-04-29 11:26:53,441] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 23 +13: [2023-04-29 11:26:53,446] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 107 + 8: [2023-04-29 11:26:53,447] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 69 +13: [2023-04-29 11:26:53,453] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt. +13: [2023-04-29 11:26:53,454] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 109 +13: [2023-04-29 11:26:53,462] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 109 +22: [2023-04-29 11:26:53,470] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt. +22: [2023-04-29 11:26:53,470] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 177 +13: [2023-04-29 11:26:53,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt. +13: [2023-04-29 11:26:53,474] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 105 +29: [2023-04-29 11:26:53,474] [INFO] [torch_checkpoint_engine.py:23:load] [Torch] Loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b/global_step84877/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt. +29: [2023-04-29 11:26:53,475] [INFO] [engine.py:2844:_get_all_zero_checkpoint_state_dicts] successfully read 128 ZeRO state_dicts for rank 233 +22: [2023-04-29 11:26:53,477] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 177 +13: [2023-04-29 11:26:53,482] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 105 +29: [2023-04-29 11:26:53,483] [INFO] [engine.py:2784:_load_zero_checkpoint] loading 128 zero partition checkpoints for rank 233 + 0: successfully loaded checkpoint from lm1-8b7-178b-c4-repetitions/8b7178b58b at iteration 0 +63: time (ms) | load-checkpoint: 13846.35 + 0: estimated model parameters: 8.905678848 + 0: estimated model parameters without embeddings: 8.458985472 + 0: [after model, optimizer, and learning rate scheduler are built] datetime: 2023-04-29 11:26:54 + 0: > building train, validation, and test datasets ... + 0: > datasets target sizes (minimum size): + 0: train: 1 + 0: validation: 51200 + 0: test: 51200 + 0: > building train, validation, and test datasets for GPT ... + 0: > building dataset index ... + 0: reading sizes... + 0: reading pointers... + 0: reading document index... + 0: creating numpy buffer of mmap... + 0: creating memory view of numpy buffer... + 0: > finished creating indexed dataset in 0.049506 seconds + 0: number of documents: 835726 + 0: > dataset split: + 0: train: + 0: document indices in [0, 835726) total of 835726 documents + 0: > loading doc-idx mapping from /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_400M_text_document_train_indexmap_1ns_2048sl_1234s_doc_idx.npy + 0: > loading sample-idx mapping from /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_400M_text_document_train_indexmap_1ns_2048sl_1234s_sample_idx.npy + 0: > loading shuffle-idx mapping from /scratch/project_462000119/data/c4_subsampled/gpt2tok_c4_en_400M_text_document_train_indexmap_1ns_2048sl_1234s_shuffle_idx.npy + 0: loaded indexed file in 0.051 seconds + 0: total number of samples: 195101 + 0: total number of epochs: 1 + 0: > building dataset index ... + 0: reading sizes... + 0: reading pointers... + 0: reading document index... + 0: creating numpy buffer of mmap... + 0: creating memory view of numpy buffer... + 0: > finished creating indexed dataset in 0.033608 seconds + 0: number of documents: 364608 + 0: > dataset split: + 0: validation: + 0: document indices in [0, 364608) total of 364608 documents + 0: > loading doc-idx mapping from /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document_validation_indexmap_51200ns_2048sl_1234s_doc_idx.npy + 0: > loading sample-idx mapping from /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document_validation_indexmap_51200ns_2048sl_1234s_sample_idx.npy + 0: > loading shuffle-idx mapping from /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document_validation_indexmap_51200ns_2048sl_1234s_shuffle_idx.npy + 0: loaded indexed file in 0.090 seconds + 0: total number of samples: 84978 + 0: total number of epochs: 1 + 0: > finished creating GPT datasets ... + 0: [after dataloaders are built] datetime: 2023-04-29 11:27:01 + 0: done with setup ... + 0: training ... +63: time (ms) | model-and-optimizer-setup: 36839.41 | train/valid/test-data-iterators-setup: 6946.46 + 0: [after training is done] datetime: 2023-04-29 11:27:01 +63: ----------------------------------------------------------------------------------------------------------------- +63: validation loss at the end of training for val data | lm loss value: 2.348107E+00 | lm loss PPL: 1.046574E+01 | +63: ----------------------------------------------------------------------------------------------------------------- +END 3430964: Sat 29 Apr 2023 11:28:35 AM EEST